diff --git "a/perplexity2575/3491175.out" "b/perplexity2575/3491175.out" new file mode 100644--- /dev/null +++ "b/perplexity2575/3491175.out" @@ -0,0 +1,40510 @@ +Model parameters: d_model 2560 ffw_size 10240 kv_size 128 n_heads 20 n_layers 34 +Megatron-DeepSpeed/pretrain_gpt.py --tensor-model-parallel-size 2 --pipeline-model-parallel-size 1 --num-layers 34 --hidden-size 2560 --num-attention-heads 20 --kv-channels 128 --ffn-hidden-size 10240 --seq-length 2048 --max-position-embeddings 2048 --micro-batch-size 2 --global-batch-size 1024 --train-samples 1 --vocab-file gpt2/vocab.json --merge-file gpt2/merges.txt --clip-grad 1.0 --kill-switch-path kill-switch-4b284b84bperplexity2575val --bf16 --optimizer adam --adam-beta1 0.9 --adam-beta2 0.999 --adam-eps 1e-8 --lr 2e-4 --min-lr 2e-5 --lr-decay-style cosine --lr-decay-samples 1 --lr-warmup-samples 0 --clip-grad 1.0 --weight-decay 1e-1 --override-lr-scheduler --reset-progress --no-load-optim --log-interval 10 --save-interval 1000 --eval-interval 1 --eval-iters 100 --eval-only true --tensorboard-dir tensorboard_4b284b84bperplexity2575val --tensorboard-queue-size 5 --log-timers-to-tensorboard --log-batch-size-to-tensorboard --log-validation-ppl-to-tensorboard --save lm1-4b2-84b-c4-perplexity/perplexity2575 --load lm1-4b2-84b-c4-perplexity/perplexity2575 --train-weighted-split-paths-path train1b5.txt --valid-weighted-split-paths-path val.txt --data-impl mmap --deepspeed --deepspeed_config ds_configs/3491175.json --zero-stage 0 +START 3491175: Wed 10 May 2023 12:51:48 PM EEST + 0: + 0: + 0: ======================= ROCm System Management Interface ======================= + 0: ================================= Concise Info ================================= + 0: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 0: 0 46.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 2 39.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 4 43.0c 80.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 6 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: ================================================================================ + 0: ============================= End of ROCm SMI Log ============================== + 2: + 2: + 2: ======================= ROCm System Management Interface ======================= + 2: ================================= Concise Info ================================= + 2: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 2: 0 43.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 2 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 4 46.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 6 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: ================================================================================ + 2: ============================= End of ROCm SMI Log ============================== + 4: + 4: + 4: ======================= ROCm System Management Interface ======================= + 4: ================================= Concise Info ================================= + 4: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 4: 0 48.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 2 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 4 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 6 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: ================================================================================ + 4: ============================= End of ROCm SMI Log ============================== +18: +18: +18: ======================= ROCm System Management Interface ======================= +18: ================================= Concise Info ================================= +18: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +18: 0 45.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 2 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 4 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 6 45.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: ================================================================================ +18: ============================= End of ROCm SMI Log ============================== +26: +26: +26: ======================= ROCm System Management Interface ======================= +26: ================================= Concise Info ================================= +26: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +26: 0 47.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 2 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 4 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 6 44.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: ================================================================================ +26: ============================= End of ROCm SMI Log ============================== +27: +27: +27: ======================= ROCm System Management Interface ======================= +27: ================================= Concise Info ================================= +27: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +27: 0 49.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 2 47.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 4 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 6 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: ================================================================================ +27: ============================= End of ROCm SMI Log ============================== +19: +19: +19: ======================= ROCm System Management Interface ======================= +19: ================================= Concise Info ================================= +19: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +19: 0 45.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 2 37.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 4 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 6 37.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: ================================================================================ +19: ============================= End of ROCm SMI Log ============================== +28: +28: +28: ======================= ROCm System Management Interface ======================= +28: ================================= Concise Info ================================= +28: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +28: 0 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 2 44.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 6 37.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: ================================================================================ +28: ============================= End of ROCm SMI Log ============================== +24: +24: +24: ======================= ROCm System Management Interface ======================= +24: ================================= Concise Info ================================= +24: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +24: 0 46.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 2 40.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 3 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 4 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 6 39.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: ================================================================================ +24: ============================= End of ROCm SMI Log ============================== +17: +17: +17: ======================= ROCm System Management Interface ======================= +17: ================================= Concise Info ================================= +17: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +17: 0 49.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 2 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 4 45.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 6 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: ================================================================================ +17: ============================= End of ROCm SMI Log ============================== + 9: + 9: + 9: ======================= ROCm System Management Interface ======================= + 9: ================================= Concise Info ================================= + 9: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 9: 0 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 2 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 4 48.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 6 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: ================================================================================ + 9: ============================= End of ROCm SMI Log ============================== +11: +11: +11: ======================= ROCm System Management Interface ======================= +11: ================================= Concise Info ================================= +11: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +11: 0 44.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 2 39.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 4 41.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 6 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: ================================================================================ +11: ============================= End of ROCm SMI Log ============================== +13: +13: +13: ======================= ROCm System Management Interface ======================= +13: ================================= Concise Info ================================= +13: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +13: 0 45.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 2 44.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 4 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 6 40.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: ================================================================================ +13: ============================= End of ROCm SMI Log ============================== +21: +21: +21: ======================= ROCm System Management Interface ======================= +21: ================================= Concise Info ================================= +21: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +21: 0 49.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 2 42.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 4 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 6 46.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 7 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: ================================================================================ +21: ============================= End of ROCm SMI Log ============================== +29: +29: +29: ======================= ROCm System Management Interface ======================= +29: ================================= Concise Info ================================= +29: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +29: 0 46.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 2 49.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 4 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 6 39.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: ================================================================================ +29: ============================= End of ROCm SMI Log ============================== + 6: + 6: + 6: ======================= ROCm System Management Interface ======================= + 6: ================================= Concise Info ================================= + 6: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 6: 0 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 2 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 4 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: ================================================================================ + 6: ============================= End of ROCm SMI Log ============================== +12: +12: +12: ======================= ROCm System Management Interface ======================= +12: ================================= Concise Info ================================= +12: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +12: 0 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 2 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 4 45.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 6 35.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: ================================================================================ +12: ============================= End of ROCm SMI Log ============================== +16: +16: +16: ======================= ROCm System Management Interface ======================= +16: ================================= Concise Info ================================= +16: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +16: 0 50.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 2 39.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 3 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 4 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 6 34.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: ================================================================================ +16: ============================= End of ROCm SMI Log ============================== +31: +31: +31: ======================= ROCm System Management Interface ======================= +31: ================================= Concise Info ================================= +31: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +31: 0 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 2 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 4 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 6 36.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: ================================================================================ +31: ============================= End of ROCm SMI Log ============================== +14: +14: +14: ======================= ROCm System Management Interface ======================= +14: ================================= Concise Info ================================= +14: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +14: 0 48.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 2 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 4 47.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 6 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: ================================================================================ +14: ============================= End of ROCm SMI Log ============================== + 5: + 5: + 5: ======================= ROCm System Management Interface ======================= + 5: ================================= Concise Info ================================= + 5: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 5: 0 48.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 2 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 4 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 6 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: ================================================================================ + 5: ============================= End of ROCm SMI Log ============================== +23: +23: +23: ======================= ROCm System Management Interface ======================= +23: ================================= Concise Info ================================= +23: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +23: 0 48.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 2 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 4 51.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 6 44.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: ================================================================================ +23: ============================= End of ROCm SMI Log ============================== + 8: + 8: + 8: ======================= ROCm System Management Interface ======================= + 8: ================================= Concise Info ================================= + 8: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 8: 0 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 2 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 4 44.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 6 35.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: ================================================================================ + 8: ============================= End of ROCm SMI Log ============================== +30: +30: +30: ======================= ROCm System Management Interface ======================= +30: ================================= Concise Info ================================= +30: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +30: 0 49.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 2 37.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 4 46.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 6 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: ================================================================================ +30: ============================= End of ROCm SMI Log ============================== +22: +22: +22: ======================= ROCm System Management Interface ======================= +22: ================================= Concise Info ================================= +22: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +22: 0 45.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 2 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 4 38.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: ================================================================================ +22: ============================= End of ROCm SMI Log ============================== +10: +10: +10: ======================= ROCm System Management Interface ======================= +10: ================================= Concise Info ================================= +10: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +10: 0 45.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 2 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 4 47.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 6 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: ================================================================================ +10: ============================= End of ROCm SMI Log ============================== + 1: + 1: + 1: ======================= ROCm System Management Interface ======================= + 1: ================================= Concise Info ================================= + 1: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 1: 0 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 2 40.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 4 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 6 38.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: ================================================================================ + 1: ============================= End of ROCm SMI Log ============================== + 3: + 3: + 3: ======================= ROCm System Management Interface ======================= + 3: ================================= Concise Info ================================= + 3: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 3: 0 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 2 39.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 4 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 6 46.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: ================================================================================ + 3: ============================= End of ROCm SMI Log ============================== + 7: + 7: + 7: ======================= ROCm System Management Interface ======================= + 7: ================================= Concise Info ================================= + 7: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 7: 0 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 2 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 4 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 6 39.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: ================================================================================ + 7: ============================= End of ROCm SMI Log ============================== +20: +20: +20: ======================= ROCm System Management Interface ======================= +20: ================================= Concise Info ================================= +20: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +20: 0 49.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 2 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 4 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 6 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: ================================================================================ +20: ============================= End of ROCm SMI Log ============================== +25: +25: +25: ======================= ROCm System Management Interface ======================= +25: ================================= Concise Info ================================= +25: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +25: 0 44.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 2 39.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 4 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 6 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: ================================================================================ +25: ============================= End of ROCm SMI Log ============================== +15: +15: +15: ======================= ROCm System Management Interface ======================= +15: ================================= Concise Info ================================= +15: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +15: 0 48.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 2 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 4 37.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 6 36.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: ================================================================================ +15: ============================= End of ROCm SMI Log ============================== +18: Launching on nid007022 (18/32), master nid005204 port 9999, GPUs 8, CUDA: True +28: Launching on nid007032 (28/32), master nid005204 port 9999, GPUs 8, CUDA: True +23: Launching on nid007027 (23/32), master nid005204 port 9999, GPUs 8, CUDA: True +14: Launching on nid006671 (14/32), master nid005204 port 9999, GPUs 8, CUDA: True +16: Launching on nid006673 (16/32), master nid005204 port 9999, GPUs 8, CUDA: True +11: Launching on nid006668 (11/32), master nid005204 port 9999, GPUs 8, CUDA: True + 5: Launching on nid006662 (5/32), master nid005204 port 9999, GPUs 8, CUDA: True + 9: Launching on nid006666 (9/32), master nid005204 port 9999, GPUs 8, CUDA: True +19: Launching on nid007023 (19/32), master nid005204 port 9999, GPUs 8, CUDA: True +22: Launching on nid007026 (22/32), master nid005204 port 9999, GPUs 8, CUDA: True +30: Launching on nid007034 (30/32), master nid005204 port 9999, GPUs 8, CUDA: True +17: Launching on nid007021 (17/32), master nid005204 port 9999, GPUs 8, CUDA: True + 4: Launching on nid006661 (4/32), master nid005204 port 9999, GPUs 8, CUDA: True + 6: Launching on nid006663 (6/32), master nid005204 port 9999, GPUs 8, CUDA: True +12: Launching on nid006669 (12/32), master nid005204 port 9999, GPUs 8, CUDA: True +24: Launching on nid007028 (24/32), master nid005204 port 9999, GPUs 8, CUDA: True +27: Launching on nid007031 (27/32), master nid005204 port 9999, GPUs 8, CUDA: True +13: Launching on nid006670 (13/32), master nid005204 port 9999, GPUs 8, CUDA: True +21: Launching on nid007025 (21/32), master nid005204 port 9999, GPUs 8, CUDA: True +10: Launching on nid006667 (10/32), master nid005204 port 9999, GPUs 8, CUDA: True + 2: Launching on nid006659 (2/32), master nid005204 port 9999, GPUs 8, CUDA: True +31: Launching on nid007035 (31/32), master nid005204 port 9999, GPUs 8, CUDA: True +29: Launching on nid007033 (29/32), master nid005204 port 9999, GPUs 8, CUDA: True +26: Launching on nid007030 (26/32), master nid005204 port 9999, GPUs 8, CUDA: True + 0: Launching on nid005204 (0/32), master nid005204 port 9999, GPUs 8, CUDA: True + 8: Launching on nid006665 (8/32), master nid005204 port 9999, GPUs 8, CUDA: True + 1: Launching on nid006658 (1/32), master nid005204 port 9999, GPUs 8, CUDA: True + 7: Launching on nid006664 (7/32), master nid005204 port 9999, GPUs 8, CUDA: True + 3: Launching on nid006660 (3/32), master nid005204 port 9999, GPUs 8, CUDA: True +15: Launching on nid006672 (15/32), master nid005204 port 9999, GPUs 8, CUDA: True +25: Launching on nid007029 (25/32), master nid005204 port 9999, GPUs 8, CUDA: True +20: Launching on nid007024 (20/32), master nid005204 port 9999, GPUs 8, CUDA: True + 0: using world size: 256, data-parallel-size: 128, tensor-model-parallel size: 2, pipeline-model-parallel size: 1 + 0: accumulate and all-reduce gradients in fp32 for bfloat16 data type. + 0: using torch.bfloat16 for parameters ... + 0: ------------------------ arguments ------------------------ + 0: abort_on_unmet_fused_kernel_constraints ......... False + 0: accumulate_allreduce_grads_in_fp32 .............. True + 0: adam_beta1 ...................................... 0.9 + 0: adam_beta2 ...................................... 0.999 + 0: adam_eps ........................................ 1e-08 + 0: adlr_autoresume ................................. False + 0: adlr_autoresume_interval ........................ 1000 + 0: apply_query_key_layer_scaling ................... True + 0: apply_residual_connection_post_layernorm ........ False + 0: attention_dropout ............................... 0.1 + 0: attention_softmax_in_fp32 ....................... False + 0: bert_binary_head ................................ True + 0: bert_load ....................................... None + 0: bf16 ............................................ True + 0: bias_dropout_fusion ............................. True + 0: bias_gelu_fusion ................................ True + 0: biencoder_projection_dim ........................ 0 + 0: biencoder_shared_query_context_model ............ False + 0: block_data_path ................................. None + 0: checkpoint_activations .......................... False + 0: checkpoint_in_cpu ............................... False + 0: checkpoint_num_layers ........................... 1 + 0: clip_grad ....................................... 1.0 + 0: codecarbon_dir .................................. None + 0: consumed_train_samples .......................... 0 + 0: consumed_train_tokens ........................... 0 + 0: consumed_valid_samples .......................... 0 + 0: contigious_checkpointing ........................ False + 0: cpu_optimizer ................................... False + 0: cpu_torch_adam .................................. False + 0: curriculum_learning ............................. False + 0: data_impl ....................................... mmap + 0: data_parallel_size .............................. 128 + 0: data_path ....................................... None + 0: dataloader_type ................................. single + 0: DDP_impl ........................................ local + 0: decoder_seq_length .............................. None + 0: deepscale ....................................... False + 0: deepscale_config ................................ None + 0: deepspeed ....................................... True + 0: deepspeed_activation_checkpointing .............. False + 0: deepspeed_config ................................ ds_configs/3491175.json + 0: deepspeed_mpi ................................... False + 0: distribute_checkpointed_activations ............. False + 0: distributed_backend ............................. nccl + 0: embed_layernorm ................................. False + 0: embedding_path .................................. None + 0: encoder_seq_length .............................. 2048 + 0: eod_mask_loss ................................... False + 0: eval_interval ................................... 1 + 0: eval_iters ...................................... 100 + 0: eval_only ....................................... True + 0: evidence_data_path .............................. None + 0: exit_duration_in_mins ........................... None + 0: exit_interval ................................... None + 0: ffn_hidden_size ................................. 10240 + 0: finetune ........................................ False + 0: fp16 ............................................ False + 0: fp16_lm_cross_entropy ........................... False + 0: fp32_residual_connection ........................ False + 0: gigaflos_no_embeds .............................. 0 + 0: global_batch_size ............................... 1024 + 0: glu_activation .................................. None + 0: hidden_dropout .................................. 0.1 + 0: hidden_size ..................................... 2560 + 0: hysteresis ...................................... 2 + 0: ict_head_size ................................... None + 0: ict_load ........................................ None + 0: img_dim ......................................... 224 + 0: indexer_batch_size .............................. 128 + 0: indexer_log_interval ............................ 1000 + 0: inference ....................................... False + 0: init_method_std ................................. 0.02 + 0: init_method_xavier_uniform ...................... False + 0: initial_loss_scale .............................. 4294967296 + 0: kill_switch_path ................................ kill-switch-4b284b84bperplexity2575val + 0: kv_channels ..................................... 128 + 0: layer_norm_fusion ............................... True + 0: layernorm_epsilon ............................... 1e-05 + 0: lazy_mpu_init ................................... None + 0: load ............................................ lm1-4b2-84b-c4-perplexity/perplexity2575 + 0: local_rank ...................................... None + 0: log_batch_size_to_tensorboard ................... True + 0: log_interval .................................... 10 + 0: log_learning_rate_to_tensorboard ................ True + 0: log_level ....................................... None + 0: log_level_replica ............................... None + 0: log_loss_scale_to_tensorboard ................... True + 0: log_num_zeros_in_grad ........................... False + 0: log_params_norm ................................. False + 0: log_path ........................................ None + 0: log_timers_to_tensorboard ....................... True + 0: log_validation_ppl_to_tensorboard ............... True + 0: loss_on_targets_only ............................ False + 0: loss_scale ...................................... None + 0: loss_scale_window ............................... 1000 + 0: lr .............................................. 0.0002 + 0: lr_decay_iters .................................. None + 0: lr_decay_samples ................................ 1 + 0: lr_decay_style .................................. cosine + 0: lr_decay_tokens ................................. None + 0: lr_warmup_fraction .............................. None + 0: lr_warmup_iters ................................. 0 + 0: lr_warmup_samples ............................... 0 + 0: make_vocab_size_divisible_by .................... 128 + 0: mask_prob ....................................... 0.15 + 0: masked_softmax_fusion ........................... True + 0: max_position_embeddings ......................... 2048 + 0: mean_noise_span_length .......................... None + 0: memory_centric_tiled_linear ..................... False + 0: merge_file ...................................... gpt2/merges.txt + 0: micro_batch_size ................................ 2 + 0: min_loss_scale .................................. 1.0 + 0: min_lr .......................................... 2e-05 + 0: mmap_warmup ..................................... False + 0: no_load_optim ................................... True + 0: no_load_rng ..................................... None + 0: no_save_optim ................................... None + 0: no_save_rng ..................................... None + 0: noise_density ................................... None + 0: num_attention_heads ............................. 20 + 0: num_channels .................................... 3 + 0: num_classes ..................................... 1000 + 0: num_layers ...................................... 34 + 0: num_layers_per_virtual_pipeline_stage ........... None + 0: num_workers ..................................... 2 + 0: onnx_safe ....................................... None + 0: openai_gelu ..................................... False + 0: optimizer ....................................... adam + 0: optimizer_fusion ................................ True + 0: override_lr_scheduler ........................... True + 0: pad_vocab_size_to ............................... None + 0: params_dtype .................................... torch.bfloat16 + 0: partition_activations ........................... False + 0: patch_dim ....................................... 16 + 0: pipeline_model_parallel_size .................... 1 + 0: position_embedding_type ......................... PositionEmbeddingType.absolute + 0: pp_partition_method ............................. None + 0: profile_backward ................................ False + 0: query_in_block_prob ............................. 0.1 + 0: rampup_batch_size ............................... None + 0: rank ............................................ 0 + 0: remote_device ................................... none + 0: reset_attention_mask ............................ False + 0: reset_position_ids .............................. False + 0: reset_progress .................................. True + 0: retriever_report_topk_accuracies ................ [] + 0: retriever_score_scaling ......................... False + 0: retriever_seq_length ............................ 256 + 0: reweight_loss_based_on_position_frequency ....... False + 0: sample_rate ..................................... 1.0 + 0: save ............................................ lm1-4b2-84b-c4-perplexity/perplexity2575 + 0: save_interval ................................... 1000 + 0: scatter_gather_tensors_in_pipeline .............. True + 0: scattered_embeddings ............................ False + 0: seed ............................................ 1234 + 0: seq_length ...................................... 2048 + 0: sgd_momentum .................................... 0.9 + 0: short_seq_prob .................................. 0.1 + 0: skip_train_iteration_range ...................... None + 0: split ........................................... None + 0: split_transformers .............................. False + 0: sync_tp_duplicated_parameters ................... False + 0: synchronize_each_layer .......................... False + 0: tensor_model_parallel_size ...................... 2 + 0: tensorboard_dir ................................. tensorboard_4b284b84bperplexity2575val + 0: tensorboard_log_interval ........................ 1 + 0: tensorboard_queue_size .......................... 5 + 0: test_weighted_split_paths ....................... None + 0: test_weighted_split_paths_path .................. None + 0: tile_factor ..................................... 1 + 0: titles_data_path ................................ None + 0: tokenizer_name_or_path .......................... None + 0: tokenizer_type .................................. GPT2BPETokenizer + 0: train_iters ..................................... None + 0: train_samples ................................... 1 + 0: train_tokens .................................... None + 0: train_weighted_split_names ...................... ['train'] + 0: train_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document']] + 0: train_weighted_split_paths_path ................. None + 0: train_weighted_split_splits ..................... [['0:1']] + 0: train_weighted_split_weights .................... [['1.0']] + 0: universal_checkpoint ............................ False + 0: use_bnb_optimizer ............................... False + 0: use_checkpoint_lr_scheduler ..................... False + 0: use_contiguous_buffers_in_ddp ................... True + 0: use_cpu_initialization .......................... None + 0: use_one_sent_docs ............................... False + 0: use_pin_memory .................................. False + 0: valid_num_workers ............................... 2 + 0: valid_weighted_split_names ...................... ['validation'] + 0: valid_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document']] + 0: valid_weighted_split_paths_path ................. None + 0: valid_weighted_split_splits ..................... [['0:1']] + 0: valid_weighted_split_weights .................... [['1.0']] + 0: virtual_pipeline_model_parallel_size ............ None + 0: vocab_extra_ids ................................. 0 + 0: vocab_file ...................................... gpt2/vocab.json + 0: weight_decay .................................... 0.1 + 0: world_size ...................................... 256 + 0: zero_allgather_bucket_size ...................... 0.0 + 0: zero_contigious_gradients ....................... False + 0: zero_reduce_bucket_size ......................... 0.0 + 0: zero_reduce_scatter ............................. False + 0: zero_stage ...................................... 0 + 0: -------------------- end of arguments --------------------- + 0: setting number of micro-batches to constant 4 + 0: > building GPT2BPETokenizer tokenizer ... + 0: > padded vocab (size: 50257) with 175 dummy tokens (new size: 50432) + 0: DeepSpeed general environment info: + 0: torch install path ............... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch'] + 0: torch version .................... 1.13.0+rocm5.2 + 0: torch cuda version ............... None + 0: torch hip version ................ 5.2.21151-afdc89f8 + 0: nvcc version ..................... None + 0: deepspeed install path ........... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/deepspeed'] + 0: deepspeed info ................... 0.7.5, unknown, unknown + 0: deepspeed wheel compiled w. ...... torch 1.13, hip 5.1 + 0: **** Git info for Megatron: git_hash=unknown git_branch=unknown **** + 0: > initializing torch distributed ... + 0: [2023-05-10 12:54:36,630] [INFO] [comm.py:633:init_distributed] Initializing TorchBackend in DeepSpeed with backend nccl +31: > setting tensorboard ... + 0: > initializing tensor model parallel with size 2 + 0: > initializing pipeline model parallel with size 1 + 0: > setting random seeds to 1234 ... + 0: > initializing model parallel cuda seeds on global rank 0, model parallel rank 0, and data parallel rank 0 with model parallel seed: 3952 and data parallel seed: 1234 + 0: > compiling dataset index builder ... + 0: make: Entering directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: make: Nothing to be done for 'default'. + 0: make: Leaving directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: >>> done with dataset index builder. Compilation time: 0.105 seconds + 0: > compiling and loading fused kernels ... + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 87 + 0: ninja: no work to do. + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 63 + 0: [1/1] c++ scaled_masked_softmax_hip.o scaled_masked_softmax_hip.cuda.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o scaled_masked_softmax_cuda.so + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda_kernel.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_hip_kernel.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 67 + 0: ninja: no work to do. + 0: >>> done with compiling and loading fused kernels. Compilation time: 23.345 seconds + 0: time to initialize megatron (seconds): -3.510 + 0: [after megatron is initialized] datetime: 2023-05-10 12:55:08 + 0: building GPT model ... + 0: [2023-05-10 12:55:08,657] [INFO] [utils.py:827:see_memory_usage] Before Building Model + 0: [2023-05-10 12:55:08,658] [INFO] [utils.py:828:see_memory_usage] MA 0.0 GB Max_MA 0.0 GB CA 0.0 GB Max_CA 0 GB + 0: [2023-05-10 12:55:08,658] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.69 GB, percent = 7.9% + 0: SEED_LAYERS=False BASE_SEED=1234 SEED_FN=None + 0: Using topology: {ProcessCoord(pipe=0, data=0, model=0): 0, ProcessCoord(pipe=0, data=0, model=1): 1, ProcessCoord(pipe=0, data=1, model=0): 2, ProcessCoord(pipe=0, data=1, model=1): 3, ProcessCoord(pipe=0, data=2, model=0): 4, ProcessCoord(pipe=0, data=2, model=1): 5, ProcessCoord(pipe=0, data=3, model=0): 6, ProcessCoord(pipe=0, data=3, model=1): 7, ProcessCoord(pipe=0, data=4, model=0): 8, ProcessCoord(pipe=0, data=4, model=1): 9, ProcessCoord(pipe=0, data=5, model=0): 10, ProcessCoord(pipe=0, data=5, model=1): 11, ProcessCoord(pipe=0, data=6, model=0): 12, ProcessCoord(pipe=0, data=6, model=1): 13, ProcessCoord(pipe=0, data=7, model=0): 14, ProcessCoord(pipe=0, data=7, model=1): 15, ProcessCoord(pipe=0, data=8, model=0): 16, ProcessCoord(pipe=0, data=8, model=1): 17, ProcessCoord(pipe=0, data=9, model=0): 18, ProcessCoord(pipe=0, data=9, model=1): 19, ProcessCoord(pipe=0, data=10, model=0): 20, ProcessCoord(pipe=0, data=10, model=1): 21, ProcessCoord(pipe=0, data=11, model=0): 22, ProcessCoord(pipe=0, data + 0: =11, model=1): 23, ProcessCoord(pipe=0, data=12, model=0): 24, ProcessCoord(pipe=0, data=12, model=1): 25, ProcessCoord(pipe=0, data=13, model=0): 26, ProcessCoord(pipe=0, data=13, model=1): 27, ProcessCoord(pipe=0, data=14, model=0): 28, ProcessCoord(pipe=0, data=14, model=1): 29, ProcessCoord(pipe=0, data=15, model=0): 30, ProcessCoord(pipe=0, data=15, model=1): 31, ProcessCoord(pipe=0, data=16, model=0): 32, ProcessCoord(pipe=0, data=16, model=1): 33, ProcessCoord(pipe=0, data=17, model=0): 34, ProcessCoord(pipe=0, data=17, model=1): 35, ProcessCoord(pipe=0, data=18, model=0): 36, ProcessCoord(pipe=0, data=18, model=1): 37, ProcessCoord(pipe=0, data=19, model=0): 38, ProcessCoord(pipe=0, data=19, model=1): 39, ProcessCoord(pipe=0, data=20, model=0): 40, ProcessCoord(pipe=0, data=20, model=1): 41, ProcessCoord(pipe=0, data=21, model=0): 42, ProcessCoord(pipe=0, data=21, model=1): 43, ProcessCoord(pipe=0, data=22, model=0): 44, ProcessCoord(pipe=0, data=22, model=1): 45, ProcessCoord(pipe=0, data=23, model=0 + 0: ): 46, ProcessCoord(pipe=0, data=23, model=1): 47, ProcessCoord(pipe=0, data=24, model=0): 48, ProcessCoord(pipe=0, data=24, model=1): 49, ProcessCoord(pipe=0, data=25, model=0): 50, ProcessCoord(pipe=0, data=25, model=1): 51, ProcessCoord(pipe=0, data=26, model=0): 52, ProcessCoord(pipe=0, data=26, model=1): 53, ProcessCoord(pipe=0, data=27, model=0): 54, ProcessCoord(pipe=0, data=27, model=1): 55, ProcessCoord(pipe=0, data=28, model=0): 56, ProcessCoord(pipe=0, data=28, model=1): 57, ProcessCoord(pipe=0, data=29, model=0): 58, ProcessCoord(pipe=0, data=29, model=1): 59, ProcessCoord(pipe=0, data=30, model=0): 60, ProcessCoord(pipe=0, data=30, model=1): 61, ProcessCoord(pipe=0, data=31, model=0): 62, ProcessCoord(pipe=0, data=31, model=1): 63, ProcessCoord(pipe=0, data=32, model=0): 64, ProcessCoord(pipe=0, data=32, model=1): 65, ProcessCoord(pipe=0, data=33, model=0): 66, ProcessCoord(pipe=0, data=33, model=1): 67, ProcessCoord(pipe=0, data=34, model=0): 68, ProcessCoord(pipe=0, data=34, model=1): 69, Proce + 0: ssCoord(pipe=0, data=35, model=0): 70, ProcessCoord(pipe=0, data=35, model=1): 71, ProcessCoord(pipe=0, data=36, model=0): 72, ProcessCoord(pipe=0, data=36, model=1): 73, ProcessCoord(pipe=0, data=37, model=0): 74, ProcessCoord(pipe=0, data=37, model=1): 75, ProcessCoord(pipe=0, data=38, model=0): 76, ProcessCoord(pipe=0, data=38, model=1): 77, ProcessCoord(pipe=0, data=39, model=0): 78, ProcessCoord(pipe=0, data=39, model=1): 79, ProcessCoord(pipe=0, data=40, model=0): 80, ProcessCoord(pipe=0, data=40, model=1): 81, ProcessCoord(pipe=0, data=41, model=0): 82, ProcessCoord(pipe=0, data=41, model=1): 83, ProcessCoord(pipe=0, data=42, model=0): 84, ProcessCoord(pipe=0, data=42, model=1): 85, ProcessCoord(pipe=0, data=43, model=0): 86, ProcessCoord(pipe=0, data=43, model=1): 87, ProcessCoord(pipe=0, data=44, model=0): 88, ProcessCoord(pipe=0, data=44, model=1): 89, ProcessCoord(pipe=0, data=45, model=0): 90, ProcessCoord(pipe=0, data=45, model=1): 91, ProcessCoord(pipe=0, data=46, model=0): 92, ProcessCoord(pipe + 0: =0, data=46, model=1): 93, ProcessCoord(pipe=0, data=47, model=0): 94, ProcessCoord(pipe=0, data=47, model=1): 95, ProcessCoord(pipe=0, data=48, model=0): 96, ProcessCoord(pipe=0, data=48, model=1): 97, ProcessCoord(pipe=0, data=49, model=0): 98, ProcessCoord(pipe=0, data=49, model=1): 99, ProcessCoord(pipe=0, data=50, model=0): 100, ProcessCoord(pipe=0, data=50, model=1): 101, ProcessCoord(pipe=0, data=51, model=0): 102, ProcessCoord(pipe=0, data=51, model=1): 103, ProcessCoord(pipe=0, data=52, model=0): 104, ProcessCoord(pipe=0, data=52, model=1): 105, ProcessCoord(pipe=0, data=53, model=0): 106, ProcessCoord(pipe=0, data=53, model=1): 107, ProcessCoord(pipe=0, data=54, model=0): 108, ProcessCoord(pipe=0, data=54, model=1): 109, ProcessCoord(pipe=0, data=55, model=0): 110, ProcessCoord(pipe=0, data=55, model=1): 111, ProcessCoord(pipe=0, data=56, model=0): 112, ProcessCoord(pipe=0, data=56, model=1): 113, ProcessCoord(pipe=0, data=57, model=0): 114, ProcessCoord(pipe=0, data=57, model=1): 115, ProcessCoord( + 0: pipe=0, data=58, model=0): 116, ProcessCoord(pipe=0, data=58, model=1): 117, ProcessCoord(pipe=0, data=59, model=0): 118, ProcessCoord(pipe=0, data=59, model=1): 119, ProcessCoord(pipe=0, data=60, model=0): 120, ProcessCoord(pipe=0, data=60, model=1): 121, ProcessCoord(pipe=0, data=61, model=0): 122, ProcessCoord(pipe=0, data=61, model=1): 123, ProcessCoord(pipe=0, data=62, model=0): 124, ProcessCoord(pipe=0, data=62, model=1): 125, ProcessCoord(pipe=0, data=63, model=0): 126, ProcessCoord(pipe=0, data=63, model=1): 127, ProcessCoord(pipe=0, data=64, model=0): 128, ProcessCoord(pipe=0, data=64, model=1): 129, ProcessCoord(pipe=0, data=65, model=0): 130, ProcessCoord(pipe=0, data=65, model=1): 131, ProcessCoord(pipe=0, data=66, model=0): 132, ProcessCoord(pipe=0, data=66, model=1): 133, ProcessCoord(pipe=0, data=67, model=0): 134, ProcessCoord(pipe=0, data=67, model=1): 135, ProcessCoord(pipe=0, data=68, model=0): 136, ProcessCoord(pipe=0, data=68, model=1): 137, ProcessCoord(pipe=0, data=69, model=0): 138, Pr + 0: ocessCoord(pipe=0, data=69, model=1): 139, ProcessCoord(pipe=0, data=70, model=0): 140, ProcessCoord(pipe=0, data=70, model=1): 141, ProcessCoord(pipe=0, data=71, model=0): 142, ProcessCoord(pipe=0, data=71, model=1): 143, ProcessCoord(pipe=0, data=72, model=0): 144, ProcessCoord(pipe=0, data=72, model=1): 145, ProcessCoord(pipe=0, data=73, model=0): 146, ProcessCoord(pipe=0, data=73, model=1): 147, ProcessCoord(pipe=0, data=74, model=0): 148, ProcessCoord(pipe=0, data=74, model=1): 149, ProcessCoord(pipe=0, data=75, model=0): 150, ProcessCoord(pipe=0, data=75, model=1): 151, ProcessCoord(pipe=0, data=76, model=0): 152, ProcessCoord(pipe=0, data=76, model=1): 153, ProcessCoord(pipe=0, data=77, model=0): 154, ProcessCoord(pipe=0, data=77, model=1): 155, ProcessCoord(pipe=0, data=78, model=0): 156, ProcessCoord(pipe=0, data=78, model=1): 157, ProcessCoord(pipe=0, data=79, model=0): 158, ProcessCoord(pipe=0, data=79, model=1): 159, ProcessCoord(pipe=0, data=80, model=0): 160, ProcessCoord(pipe=0, data=80, model= + 0: 1): 161, ProcessCoord(pipe=0, data=81, model=0): 162, ProcessCoord(pipe=0, data=81, model=1): 163, ProcessCoord(pipe=0, data=82, model=0): 164, ProcessCoord(pipe=0, data=82, model=1): 165, ProcessCoord(pipe=0, data=83, model=0): 166, ProcessCoord(pipe=0, data=83, model=1): 167, ProcessCoord(pipe=0, data=84, model=0): 168, ProcessCoord(pipe=0, data=84, model=1): 169, ProcessCoord(pipe=0, data=85, model=0): 170, ProcessCoord(pipe=0, data=85, model=1): 171, ProcessCoord(pipe=0, data=86, model=0): 172, ProcessCoord(pipe=0, data=86, model=1): 173, ProcessCoord(pipe=0, data=87, model=0): 174, ProcessCoord(pipe=0, data=87, model=1): 175, ProcessCoord(pipe=0, data=88, model=0): 176, ProcessCoord(pipe=0, data=88, model=1): 177, ProcessCoord(pipe=0, data=89, model=0): 178, ProcessCoord(pipe=0, data=89, model=1): 179, ProcessCoord(pipe=0, data=90, model=0): 180, ProcessCoord(pipe=0, data=90, model=1): 181, ProcessCoord(pipe=0, data=91, model=0): 182, ProcessCoord(pipe=0, data=91, model=1): 183, ProcessCoord(pipe=0, data + 0: =92, model=0): 184, ProcessCoord(pipe=0, data=92, model=1): 185, ProcessCoord(pipe=0, data=93, model=0): 186, ProcessCoord(pipe=0, data=93, model=1): 187, ProcessCoord(pipe=0, data=94, model=0): 188, ProcessCoord(pipe=0, data=94, model=1): 189, ProcessCoord(pipe=0, data=95, model=0): 190, ProcessCoord(pipe=0, data=95, model=1): 191, ProcessCoord(pipe=0, data=96, model=0): 192, ProcessCoord(pipe=0, data=96, model=1): 193, ProcessCoord(pipe=0, data=97, model=0): 194, ProcessCoord(pipe=0, data=97, model=1): 195, ProcessCoord(pipe=0, data=98, model=0): 196, ProcessCoord(pipe=0, data=98, model=1): 197, ProcessCoord(pipe=0, data=99, model=0): 198, ProcessCoord(pipe=0, data=99, model=1): 199, ProcessCoord(pipe=0, data=100, model=0): 200, ProcessCoord(pipe=0, data=100, model=1): 201, ProcessCoord(pipe=0, data=101, model=0): 202, ProcessCoord(pipe=0, data=101, model=1): 203, ProcessCoord(pipe=0, data=102, model=0): 204, ProcessCoord(pipe=0, data=102, model=1): 205, ProcessCoord(pipe=0, data=103, model=0): 206, Process + 0: Coord(pipe=0, data=103, model=1): 207, ProcessCoord(pipe=0, data=104, model=0): 208, ProcessCoord(pipe=0, data=104, model=1): 209, ProcessCoord(pipe=0, data=105, model=0): 210, ProcessCoord(pipe=0, data=105, model=1): 211, ProcessCoord(pipe=0, data=106, model=0): 212, ProcessCoord(pipe=0, data=106, model=1): 213, ProcessCoord(pipe=0, data=107, model=0): 214, ProcessCoord(pipe=0, data=107, model=1): 215, ProcessCoord(pipe=0, data=108, model=0): 216, ProcessCoord(pipe=0, data=108, model=1): 217, ProcessCoord(pipe=0, data=109, model=0): 218, ProcessCoord(pipe=0, data=109, model=1): 219, ProcessCoord(pipe=0, data=110, model=0): 220, ProcessCoord(pipe=0, data=110, model=1): 221, ProcessCoord(pipe=0, data=111, model=0): 222, ProcessCoord(pipe=0, data=111, model=1): 223, ProcessCoord(pipe=0, data=112, model=0): 224, ProcessCoord(pipe=0, data=112, model=1): 225, ProcessCoord(pipe=0, data=113, model=0): 226, ProcessCoord(pipe=0, data=113, model=1): 227, ProcessCoord(pipe=0, data=114, model=0): 228, ProcessCoord(pipe=0 + 0: , data=114, model=1): 229, ProcessCoord(pipe=0, data=115, model=0): 230, ProcessCoord(pipe=0, data=115, model=1): 231, ProcessCoord(pipe=0, data=116, model=0): 232, ProcessCoord(pipe=0, data=116, model=1): 233, ProcessCoord(pipe=0, data=117, model=0): 234, ProcessCoord(pipe=0, data=117, model=1): 235, ProcessCoord(pipe=0, data=118, model=0): 236, ProcessCoord(pipe=0, data=118, model=1): 237, ProcessCoord(pipe=0, data=119, model=0): 238, ProcessCoord(pipe=0, data=119, model=1): 239, ProcessCoord(pipe=0, data=120, model=0): 240, ProcessCoord(pipe=0, data=120, model=1): 241, ProcessCoord(pipe=0, data=121, model=0): 242, ProcessCoord(pipe=0, data=121, model=1): 243, ProcessCoord(pipe=0, data=122, model=0): 244, ProcessCoord(pipe=0, data=122, model=1): 245, ProcessCoord(pipe=0, data=123, model=0): 246, ProcessCoord(pipe=0, data=123, model=1): 247, ProcessCoord(pipe=0, data=124, model=0): 248, ProcessCoord(pipe=0, data=124, model=1): 249, ProcessCoord(pipe=0, data=125, model=0): 250, ProcessCoord(pipe=0, data=125, + 0: model=1): 251, ProcessCoord(pipe=0, data=126, model=0): 252, ProcessCoord(pipe=0, data=126, model=1): 253, ProcessCoord(pipe=0, data=127, model=0): 254, ProcessCoord(pipe=0, data=127, model=1): 255} + 0: [2023-05-10 12:55:14,091] [INFO] [module.py:366:_partition_layers] Partitioning pipeline stages with method type:transformer + 0: stage=0 layers=41 + 0: 0: _to_float16 + 0: 1: EmbeddingPipe + 0: 2: + 0: 3: ParallelTransformerLayerPipe + 0: 4: ParallelTransformerLayerPipe + 0: 5: ParallelTransformerLayerPipe + 0: 6: ParallelTransformerLayerPipe + 0: 7: ParallelTransformerLayerPipe + 0: 8: ParallelTransformerLayerPipe + 0: 9: ParallelTransformerLayerPipe + 0: 10: ParallelTransformerLayerPipe + 0: 11: ParallelTransformerLayerPipe + 0: 12: ParallelTransformerLayerPipe + 0: 13: ParallelTransformerLayerPipe + 0: 14: ParallelTransformerLayerPipe + 0: 15: ParallelTransformerLayerPipe + 0: 16: ParallelTransformerLayerPipe + 0: 17: ParallelTransformerLayerPipe + 0: 18: ParallelTransformerLayerPipe + 0: 19: ParallelTransformerLayerPipe + 0: 20: ParallelTransformerLayerPipe + 0: 21: ParallelTransformerLayerPipe + 0: 22: ParallelTransformerLayerPipe + 0: 23: ParallelTransformerLayerPipe + 0: 24: ParallelTransformerLayerPipe + 0: 25: ParallelTransformerLayerPipe + 0: 26: ParallelTransformerLayerPipe + 0: 27: ParallelTransformerLayerPipe + 0: 28: ParallelTransformerLayerPipe + 0: 29: ParallelTransformerLayerPipe + 0: 30: ParallelTransformerLayerPipe + 0: 31: ParallelTransformerLayerPipe + 0: 32: ParallelTransformerLayerPipe + 0: 33: ParallelTransformerLayerPipe + 0: 34: ParallelTransformerLayerPipe + 0: 35: ParallelTransformerLayerPipe + 0: 36: ParallelTransformerLayerPipe + 0: 37: undo + 0: 38: MixedFusedLayerNorm + 0: 39: EmbeddingPipe + 0: 40: float16_to_fp32 + 0: loss: CrossEntropy + 0: [2023-05-10 12:55:14,543] [INFO] [utils.py:827:see_memory_usage] After Building Model + 0: [2023-05-10 12:55:14,543] [INFO] [utils.py:828:see_memory_usage] MA 2.7 GB Max_MA 2.7 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:55:14,543] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.84 GB, percent = 7.9% + 0: setting training iterations to 0 + 0: > learning rate decay style: cosine + 0: DeepSpeed is enabled. + 0: [2023-05-10 12:55:14,546] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed info: version=0.7.5, git-hash=unknown, git-branch=unknown + 0: [2023-05-10 12:55:20,478] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Flops Profiler Enabled: False + 0: [2023-05-10 12:55:20,479] [INFO] [logging.py:68:log_dist] [Rank 0] Removing param_group that has no 'params' in the client Optimizer + 0: [2023-05-10 12:55:20,479] [INFO] [logging.py:68:log_dist] [Rank 0] Using client Optimizer as basic optimizer + 0: [2023-05-10 12:55:20,499] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Basic Optimizer = FusedAdam + 0: [2023-05-10 12:55:20,499] [INFO] [logging.py:68:log_dist] [Rank 0] Creating BF16 optimizer + 0: [2023-05-10 12:55:20,628] [INFO] [utils.py:827:see_memory_usage] begin bf16_optimizer + 0: [2023-05-10 12:55:20,629] [INFO] [utils.py:828:see_memory_usage] MA 2.69 GB Max_MA 2.71 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:55:20,629] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.5 GB, percent = 8.0% + 0: ninja: no work to do. + 0: Time to load utils op: 0.39843320846557617 seconds + 0: Time to load utils op: 0.2857973575592041 seconds + 0: Time to load utils op: 0.3982274532318115 seconds + 0: Time to load utils op: 0.3990907669067383 seconds +16: Time to load utils op: 0.38068366050720215 seconds +16: Time to load utils op: 0.3806929588317871 seconds +16: Time to load utils op: 0.380704402923584 seconds +16: Time to load utils op: 0.3807191848754883 seconds +14: Time to load utils op: 0.3983590602874756 secondsTime to load utils op: 0.39940762519836426 seconds +14: +14: Time to load utils op: 0.39934396743774414 seconds +14: Time to load utils op: 0.39859437942504883 seconds +25: Time to load utils op: 0.3937692642211914 seconds +25: Time to load utils op: 0.3936350345611572 secondsTime to load utils op: 0.3939485549926758 seconds +25: +25: Time to load utils op: 0.3939359188079834 seconds + 2: Time to load utils op: 0.4049384593963623 seconds + 2: Time to load utils op: 0.4051516056060791 secondsTime to load utils op: 0.40526461601257324 seconds + 2: + 2: Time to load utils op: 0.40527772903442383 seconds + 5: Time to load utils op: 0.40476512908935547 seconds + 5: Time to load utils op: 0.4046142101287842 seconds + 5: Time to load utils op: 0.4046609401702881 seconds + 5: Time to load utils op: 0.4048013687133789 seconds + 9: Time to load utils op: 0.3825509548187256 seconds + 9: Time to load utils op: 0.38256216049194336 seconds + 9: Time to load utils op: 0.3825716972351074 seconds + 9: Time to load utils op: 0.382580041885376 seconds + 8: Time to load utils op: 0.3827188014984131 seconds + 8: Time to load utils op: 0.3827383518218994 secondsTime to load utils op: 0.3827400207519531 seconds + 8: + 8: Time to load utils op: 0.3827509880065918 seconds +27: Time to load utils op: 0.394132137298584 seconds +27: Time to load utils op: 0.3946866989135742 seconds +27: Time to load utils op: 0.3937036991119385 seconds +27: Time to load utils op: 0.39438676834106445 seconds +26: Time to load utils op: 0.39467883110046387 secondsTime to load utils op: 0.39495134353637695 seconds +26: +26: Time to load utils op: 0.3952302932739258 seconds +26: Time to load utils op: 0.39476966857910156 seconds +17: Time to load utils op: 0.3836205005645752 secondsTime to load utils op: 0.3836231231689453 seconds +17: +17: Time to load utils op: 0.3836333751678467 seconds +17: Time to load utils op: 0.3836507797241211 seconds +23: Time to load utils op: 0.3836054801940918 seconds +23: Time to load utils op: 0.38361120223999023 secondsTime to load utils op: 0.383620023727417 seconds +23: +23: Time to load utils op: 0.3836240768432617 seconds + 7: Time to load utils op: 0.3843414783477783 seconds + 7: Time to load utils op: 0.3843345642089844 seconds + 7: Time to load utils op: 0.38437485694885254 seconds + 7: Time to load utils op: 0.3843822479248047 seconds + 6: Time to load utils op: 0.38382768630981445 seconds + 6: Time to load utils op: 0.38384246826171875 seconds + 6: Time to load utils op: 0.3838469982147217 seconds + 6: Time to load utils op: 0.38385486602783203 seconds + 4: Time to load utils op: 0.38483500480651855 seconds + 4: Time to load utils op: 0.38491225242614746 seconds + 4: Time to load utils op: 0.3849167823791504 seconds + 4: Time to load utils op: 0.3849315643310547 seconds +24: Time to load utils op: 0.3843379020690918 seconds +24: Time to load utils op: 0.3843395709991455 seconds +24: Time to load utils op: 0.38434314727783203 seconds +24: Time to load utils op: 0.3843514919281006 seconds +15: Time to load utils op: 0.38430285453796387 secondsTime to load utils op: 0.38430309295654297 secondsTime to load utils op: 0.3843057155609131 seconds +15: +15: +15: Time to load utils op: 0.38429951667785645 seconds +10: Time to load utils op: 0.38466644287109375 secondsTime to load utils op: 0.38468480110168457 seconds +10: +10: Time to load utils op: 0.3846890926361084 secondsTime to load utils op: 0.3846883773803711 seconds +10: +28: Time to load utils op: 0.3844900131225586 seconds +28: Time to load utils op: 0.38451647758483887 seconds +28: Time to load utils op: 0.3845193386077881 secondsTime to load utils op: 0.3845233917236328 seconds +28: +12: Time to load utils op: 0.38474607467651367 secondsTime to load utils op: 0.38474082946777344 seconds +12: +12: Time to load utils op: 0.38475918769836426 seconds +12: Time to load utils op: 0.3847658634185791 seconds +18: Time to load utils op: 0.3841886520385742 secondsTime to load utils op: 0.38420677185058594 seconds +18: +18: Time to load utils op: 0.3842189311981201 seconds +18: Time to load utils op: 0.3842315673828125 seconds +21: Time to load utils op: 0.38432931900024414 seconds +21: Time to load utils op: 0.38434672355651855 seconds +21: Time to load utils op: 0.38434600830078125 seconds +21: Time to load utils op: 0.3843538761138916 seconds +29: Time to load utils op: 0.38440632820129395 secondsTime to load utils op: 0.38441967964172363 seconds +29: +29: Time to load utils op: 0.3844325542449951 seconds + 3: Time to load utils op: 0.3843505382537842 secondsTime to load utils op: 0.38435935974121094 seconds + 3: + 3: Time to load utils op: 0.3843722343444824 seconds +20: Time to load utils op: 0.38451075553894043 secondsTime to load utils op: 0.38451242446899414 seconds +20: +20: Time to load utils op: 0.3845198154449463 secondsTime to load utils op: 0.3845186233520508 seconds +20: +29: Time to load utils op: 0.3844294548034668 seconds + 3: Time to load utils op: 0.3843865394592285 seconds + 1: Time to load utils op: 0.38438868522644043 secondsTime to load utils op: 0.38439488410949707 seconds + 1: + 1: Time to load utils op: 0.38442254066467285 seconds + 1: Time to load utils op: 0.3844187259674072 seconds +11: Time to load utils op: 0.38499999046325684 seconds +11: Time to load utils op: 0.3850212097167969 secondsTime to load utils op: 0.3850221633911133 seconds +11: +11: Time to load utils op: 0.3850443363189697 seconds +22: Time to load utils op: 0.38481593132019043 secondsTime to load utils op: 0.3848123550415039 seconds +22: +22: Time to load utils op: 0.3848278522491455 seconds +22: Time to load utils op: 0.3848421573638916 seconds +19: Time to load utils op: 0.3850531578063965 seconds +19: Time to load utils op: 0.3850703239440918 seconds +19: Time to load utils op: 0.3850867748260498 seconds +19: Time to load utils op: 0.3851001262664795 seconds +31: Time to load utils op: 0.38488197326660156 secondsTime to load utils op: 0.3848836421966553 seconds +31: +31: Time to load utils op: 0.38489389419555664 seconds +13: Time to load utils op: 0.38498806953430176 seconds +13: Time to load utils op: 0.38500142097473145 seconds +13: Time to load utils op: 0.3850138187408447 seconds +31: Time to load utils op: 0.3849151134490967 seconds +13: Time to load utils op: 0.3850128650665283 seconds +30: Time to load utils op: 0.38535404205322266 secondsTime to load utils op: 0.38536500930786133 seconds +30: +30: Time to load utils op: 0.3853728771209717 seconds +30: Time to load utils op: 0.3853740692138672 seconds + 0: [2023-05-10 12:55:21,039] [INFO] [utils.py:827:see_memory_usage] before initializing group 0 + 0: [2023-05-10 12:55:21,039] [INFO] [utils.py:828:see_memory_usage] MA 2.69 GB Max_MA 2.69 GB CA 2.77 GB Max_CA 3 GB + 0: [2023-05-10 12:55:21,039] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.51 GB, percent = 8.1% + 4: Time to load utils op: 0.0009138584136962891 seconds + 4: Time to load utils op: 0.0009343624114990234 seconds + 4: Time to load utils op: 0.0008609294891357422 seconds + 4: Time to load utils op: 0.0009624958038330078 seconds +19: Time to load utils op: 0.0008223056793212891 seconds +19: Time to load utils op: 0.0009465217590332031 seconds +19: Time to load utils op: 0.0009133815765380859 seconds +19: Time to load utils op: 0.0009613037109375 seconds + 5: Time to load utils op: 0.0009624958038330078 seconds + 5: Time to load utils op: 0.0011365413665771484 seconds + 5: Time to load utils op: 0.001129150390625 seconds + 5: Time to load utils op: 0.0011875629425048828 seconds +27: Time to load utils op: 0.0009686946868896484 seconds +27: Time to load utils op: 0.0010118484497070312 secondsTime to load utils op: 0.0009264945983886719 seconds +27: +27: Time to load utils op: 0.0010631084442138672 seconds + 8: Time to load utils op: 0.0008752346038818359 seconds + 8: Time to load utils op: 0.0009503364562988281 secondsTime to load utils op: 0.0009224414825439453 seconds + 8: + 8: Time to load utils op: 0.0009593963623046875 seconds + 0: Time to load utils op: 0.0005867481231689453 seconds +13: Time to load utils op: 0.0007822513580322266 seconds +13: Time to load utils op: 0.0008528232574462891 seconds +13: Time to load utils op: 0.0007760524749755859 seconds + 0: Time to load utils op: 0.0006206035614013672 seconds +13: Time to load utils op: 0.0009663105010986328 seconds + 2: Time to load utils op: 0.0009794235229492188 seconds + 2: Time to load utils op: 0.0009000301361083984 secondsTime to load utils op: 0.0010306835174560547 seconds + 2: + 2: Time to load utils op: 0.0009710788726806641 seconds + 0: Time to load utils op: 0.0005583763122558594 seconds + 1: Time to load utils op: 0.0007879734039306641 seconds + 1: Time to load utils op: 0.0007989406585693359 seconds + 1: Time to load utils op: 0.0007028579711914062 seconds + 1: Time to load utils op: 0.0009543895721435547 seconds +28: Time to load utils op: 0.0007658004760742188 seconds +28: Time to load utils op: 0.0009243488311767578 seconds +28: Time to load utils op: 0.0009062290191650391 seconds +28: Time to load utils op: 0.0008702278137207031 seconds +16: Time to load utils op: 0.0008070468902587891 seconds +16: Time to load utils op: 0.0008897781372070312 seconds +16: Time to load utils op: 0.0008912086486816406 seconds +16: Time to load utils op: 0.0009763240814208984 seconds + 3: Time to load utils op: 0.0007851123809814453 seconds + 3: Time to load utils op: 0.0008833408355712891 secondsTime to load utils op: 0.0008769035339355469 seconds + 3: +10: Time to load utils op: 0.0008251667022705078 seconds +10: Time to load utils op: 0.0009071826934814453 seconds +10: Time to load utils op: 0.0009107589721679688 seconds + 3: Time to load utils op: 0.0008814334869384766 seconds +10: Time to load utils op: 0.0009133815765380859 seconds + 6: Time to load utils op: 0.0007283687591552734 seconds + 6: Time to load utils op: 0.0010137557983398438 secondsTime to load utils op: 0.001062631607055664 seconds + 6: + 6: Time to load utils op: 0.0010557174682617188 seconds +14: Time to load utils op: 0.0008955001831054688 seconds +14: Time to load utils op: 0.001056671142578125 secondsTime to load utils op: 0.0010039806365966797 seconds +14: +26: Time to load utils op: 0.0009753704071044922 secondsTime to load utils op: 0.0009958744049072266 seconds +26: +26: Time to load utils op: 0.0009763240814208984 seconds +14: Time to load utils op: 0.0010204315185546875 seconds +26: Time to load utils op: 0.0010285377502441406 seconds +25: Time to load utils op: 0.00080108642578125 seconds +25: Time to load utils op: 0.0009386539459228516 seconds +25: Time to load utils op: 0.0009469985961914062 seconds +25: Time to load utils op: 0.0008554458618164062 seconds +12: Time to load utils op: 0.0009882450103759766 seconds +12: Time to load utils op: 0.0010058879852294922 seconds +12: Time to load utils op: 0.0009942054748535156 seconds +15: Time to load utils op: 0.0009305477142333984 seconds +15: Time to load utils op: 0.0008981227874755859 seconds +15: Time to load utils op: 0.0008883476257324219 seconds +12: Time to load utils op: 0.0010068416595458984 seconds +15: Time to load utils op: 0.0009179115295410156 seconds +20: Time to load utils op: 0.0009202957153320312 seconds +20: Time to load utils op: 0.0009641647338867188 seconds +20: Time to load utils op: 0.0009684562683105469 seconds +20: Time to load utils op: 0.0009965896606445312 seconds +22: Time to load utils op: 0.0007548332214355469 seconds +22: Time to load utils op: 0.0008208751678466797 seconds +22: Time to load utils op: 0.0007944107055664062 seconds +22: Time to load utils op: 0.0008943080902099609 seconds +31: Time to load utils op: 0.0009613037109375 secondsTime to load utils op: 0.0009551048278808594 seconds +31: +31: Time to load utils op: 0.0008699893951416016 seconds +31: Time to load utils op: 0.0009908676147460938 seconds +23: Time to load utils op: 0.0005791187286376953 seconds +23: Time to load utils op: 0.000782012939453125 seconds +23: Time to load utils op: 0.000835418701171875 seconds +24: Time to load utils op: 0.0008823871612548828 secondsTime to load utils op: 0.0008943080902099609 secondsTime to load utils op: 0.000896453857421875 seconds +24: +24: +23: Time to load utils op: 0.0009253025054931641 seconds +24: Time to load utils op: 0.0008976459503173828 seconds +29: Time to load utils op: 0.000873565673828125 seconds +29: Time to load utils op: 0.0009567737579345703 seconds +29: Time to load utils op: 0.0009572505950927734 seconds +29: Time to load utils op: 0.0009591579437255859 seconds +21: Time to load utils op: 0.001004934310913086 seconds +21: Time to load utils op: 0.0009722709655761719 seconds +21: Time to load utils op: 0.0010285377502441406 seconds +21: Time to load utils op: 0.0011212825775146484 seconds +17: Time to load utils op: 0.0008115768432617188 seconds +18: Time to load utils op: 0.0006983280181884766 seconds +17: Time to load utils op: 0.0008342266082763672 secondsTime to load utils op: 0.0008344650268554688 seconds +17: +17: Time to load utils op: 0.000904083251953125 seconds +18: Time to load utils op: 0.0007822513580322266 seconds +18: Time to load utils op: 0.0007233619689941406 seconds +18: Time to load utils op: 0.0008704662322998047 seconds +11: Time to load utils op: 0.0006849765777587891 secondsTime to load utils op: 0.0006310939788818359 seconds +11: +11: Time to load utils op: 0.0008370876312255859 seconds +11: Time to load utils op: 0.0008959770202636719 seconds + 0: [2023-05-10 12:55:21,228] [INFO] [utils.py:827:see_memory_usage] after initializing group 0 +30: Time to load utils op: 0.0007119178771972656 seconds +30: Time to load utils op: 0.0007691383361816406 secondsTime to load utils op: 0.0007715225219726562 seconds +30: +30: Time to load utils op: 0.0008294582366943359 seconds + 0: [2023-05-10 12:55:21,229] [INFO] [utils.py:828:see_memory_usage] MA 5.38 GB Max_MA 5.38 GB CA 6.82 GB Max_CA 7 GB + 0: [2023-05-10 12:55:21,229] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.59 GB, percent = 8.1% + 7: Time to load utils op: 0.0008444786071777344 seconds + 7: Time to load utils op: 0.0009179115295410156 seconds + 7: Time to load utils op: 0.0009171962738037109 seconds + 7: Time to load utils op: 0.0009794235229492188 seconds + 9: Time to load utils op: 0.0008203983306884766 seconds + 9: Time to load utils op: 0.0007684230804443359 seconds + 9: Time to load utils op: 0.0006110668182373047 seconds + 9: Time to load utils op: 0.0009212493896484375 seconds + 0: [2023-05-10 12:55:21,346] [INFO] [utils.py:827:see_memory_usage] before initializing group 1 + 0: [2023-05-10 12:55:21,347] [INFO] [utils.py:828:see_memory_usage] MA 5.38 GB Max_MA 5.38 GB CA 6.82 GB Max_CA 7 GB + 0: [2023-05-10 12:55:21,347] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.63 GB, percent = 8.1% + 0: [2023-05-10 12:55:21,467] [INFO] [utils.py:827:see_memory_usage] after initializing group 1 + 0: [2023-05-10 12:55:21,467] [INFO] [utils.py:828:see_memory_usage] MA 7.9 GB Max_MA 7.9 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,467] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.6 GB, percent = 8.1% + 0: [2023-05-10 12:55:21,584] [INFO] [utils.py:827:see_memory_usage] before initializing group 2 + 0: [2023-05-10 12:55:21,585] [INFO] [utils.py:828:see_memory_usage] MA 7.9 GB Max_MA 7.9 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,585] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.65 GB, percent = 8.1% + 0: [2023-05-10 12:55:21,705] [INFO] [utils.py:827:see_memory_usage] after initializing group 2 + 0: [2023-05-10 12:55:21,706] [INFO] [utils.py:828:see_memory_usage] MA 7.91 GB Max_MA 7.91 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,706] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.69 GB, percent = 8.1% + 0: ninja: no work to do. + 0: Time to load utils op: 0.3561413288116455 seconds +18: Time to load utils op: 0.304502010345459 secondsTime to load utils op: 0.3045063018798828 secondsTime to load utils op: 0.30444836616516113 seconds +18: +18: +18: Time to load utils op: 0.3049352169036865 seconds + 1: Time to load utils op: 0.312896728515625 seconds +15: Time to load utils op: 0.31400012969970703 seconds + 1: Time to load utils op: 0.3186779022216797 seconds + 7: Time to load utils op: 0.34078335762023926 seconds +15: Time to load utils op: 0.31989502906799316 seconds +15: Time to load utils op: 0.32010602951049805 seconds +15: Time to load utils op: 0.3208456039428711 seconds + 1: Time to load utils op: 0.3372960090637207 seconds + 7: Time to load utils op: 0.3466484546661377 seconds +14: Time to load utils op: 0.3526341915130615 seconds + 1: Time to load utils op: 0.33113622665405273 seconds + 7: Time to load utils op: 0.3524327278137207 seconds + 2: Time to load utils op: 0.36229753494262695 seconds +26: Time to load utils op: 0.35007333755493164 seconds +14: Time to load utils op: 0.35930347442626953 seconds + 7: Time to load utils op: 0.35884642601013184 seconds + 2: Time to load utils op: 0.3677353858947754 seconds +26: Time to load utils op: 0.354996919631958 seconds +14: Time to load utils op: 0.3656783103942871 seconds + 2: Time to load utils op: 0.3746356964111328 seconds +26: Time to load utils op: 0.3622152805328369 seconds +14: Time to load utils op: 0.3719451427459717 seconds +30: Time to load utils op: 0.3441746234893799 seconds + 2: Time to load utils op: 0.38053202629089355 seconds +26: Time to load utils op: 0.36810755729675293 seconds + 0: [2023-05-10 12:55:21,819] [INFO] [utils.py:827:see_memory_usage] before initialize_optimizer + 0: [2023-05-10 12:55:21,820] [INFO] [utils.py:828:see_memory_usage] MA 7.91 GB Max_MA 7.91 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,820] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.7 GB, percent = 8.1% +30: Time to load utils op: 0.33437681198120117 seconds +28: Time to load utils op: 0.3707239627838135 seconds +12: Time to load utils op: 0.3252987861633301 seconds +31: Time to load utils op: 0.34109950065612793 seconds +20: Time to load utils op: 0.3461167812347412 seconds +23: Time to load utils op: 0.31858348846435547 seconds + 5: Time to load utils op: 0.34891748428344727 seconds +11: Time to load utils op: 0.3170452117919922 seconds +30: Time to load utils op: 0.3405799865722656 seconds +28: Time to load utils op: 0.3768308162689209 seconds +31: Time to load utils op: 0.3503255844116211 seconds +12: Time to load utils op: 0.33144068717956543 seconds +21: Time to load utils op: 0.3406546115875244 seconds +22: Time to load utils op: 0.34393763542175293 seconds + 8: Time to load utils op: 0.31956958770751953 seconds + 3: Time to load utils op: 0.32199978828430176 seconds +20: Time to load utils op: 0.3522963523864746 seconds +23: Time to load utils op: 0.32462334632873535 seconds +11: Time to load utils op: 0.3228719234466553 seconds + 5: Time to load utils op: 0.3551974296569824 seconds +30: Time to load utils op: 0.3467392921447754 seconds +28: Time to load utils op: 0.3827247619628906 seconds +12: Time to load utils op: 0.34080004692077637 seconds +17: Time to load utils op: 0.33420348167419434 seconds +31: Time to load utils op: 0.3516561985015869 seconds +24: Time to load utils op: 0.30718040466308594 seconds +28: Time to load utils op: 0.3862419128417969 seconds +22: Time to load utils op: 0.349719762802124 seconds +21: Time to load utils op: 0.3312406539916992 seconds +19: Time to load utils op: 0.30982136726379395 seconds +16: Time to load utils op: 0.30569005012512207 seconds +23: Time to load utils op: 0.33040785789489746 seconds + 8: Time to load utils op: 0.32557082176208496 seconds +20: Time to load utils op: 0.3583652973175049 seconds + 3: Time to load utils op: 0.33432602882385254 seconds +11: Time to load utils op: 0.3291609287261963 seconds + 5: Time to load utils op: 0.36118316650390625 seconds + 4: Time to load utils op: 0.3246324062347412 seconds +27: Time to load utils op: 0.39118456840515137 seconds +25: Time to load utils op: 0.3918640613555908 seconds +12: Time to load utils op: 0.34688353538513184 seconds +31: Time to load utils op: 0.3561971187591553 seconds +17: Time to load utils op: 0.34038567543029785 seconds +21: Time to load utils op: 0.3344581127166748 seconds + 9: Time to load utils op: 0.32217860221862793 seconds + 6: Time to load utils op: 0.31875038146972656 seconds +13: Time to load utils op: 0.318892240524292 seconds +10: Time to load utils op: 0.3226628303527832 seconds +24: Time to load utils op: 0.31356287002563477 seconds +19: Time to load utils op: 0.3158416748046875 seconds +22: Time to load utils op: 0.3564019203186035 seconds + 8: Time to load utils op: 0.3468170166015625 seconds + 3: Time to load utils op: 0.33389735221862793 seconds +20: Time to load utils op: 0.3642909526824951 seconds +16: Time to load utils op: 0.31172609329223633 seconds +23: Time to load utils op: 0.35012149810791016 seconds + 6: Time to load utils op: 0.3220679759979248 seconds +11: Time to load utils op: 0.33516573905944824 seconds + 5: Time to load utils op: 0.367159366607666 seconds + 4: Time to load utils op: 0.33056020736694336 seconds +27: Time to load utils op: 0.3968689441680908 seconds +25: Time to load utils op: 0.39916300773620605 seconds +21: Time to load utils op: 0.34029531478881836 seconds +17: Time to load utils op: 0.3461787700653076 seconds + 9: Time to load utils op: 0.32847023010253906 seconds +29: Time to load utils op: 0.31298160552978516 seconds +10: Time to load utils op: 0.3347628116607666 seconds +13: Time to load utils op: 0.3250114917755127 seconds +24: Time to load utils op: 0.31929945945739746 seconds + 6: Time to load utils op: 0.32855653762817383 seconds +19: Time to load utils op: 0.32192254066467285 seconds +22: Time to load utils op: 0.3621211051940918 seconds + 8: Time to load utils op: 0.3376352787017822 seconds + 3: Time to load utils op: 0.3400411605834961 seconds +16: Time to load utils op: 0.3178989887237549 seconds + 4: Time to load utils op: 0.3370387554168701 seconds +27: Time to load utils op: 0.4026496410369873 seconds +25: Time to load utils op: 0.40415358543395996 seconds + 9: Time to load utils op: 0.33424830436706543 seconds +10: Time to load utils op: 0.34081482887268066 seconds +15: Time to load utils op: 0.004193544387817383 seconds +17: Time to load utils op: 0.35229945182800293 seconds +13: Time to load utils op: 0.3311307430267334 seconds +29: Time to load utils op: 0.3191258907318115 seconds +24: Time to load utils op: 0.3254818916320801 seconds +16: Time to load utils op: 0.32370829582214355 seconds +19: Time to load utils op: 0.3282806873321533 seconds +13: Time to load utils op: 0.3339724540710449 seconds + 6: Time to load utils op: 0.33457255363464355 seconds + 9: Time to load utils op: 0.34035706520080566 seconds +29: Time to load utils op: 0.324845552444458 seconds + 4: Time to load utils op: 0.34278106689453125 seconds +27: Time to load utils op: 0.4092378616333008 seconds +25: Time to load utils op: 0.4104018211364746 seconds +10: Time to load utils op: 0.3469252586364746 seconds +15: Time to load utils op: 0.0004279613494873047 secondsTime to load utils op: 0.0004317760467529297 secondsTime to load utils op: 0.00043201446533203125 seconds +15: +15: + 0: Time to load utils op: 0.42562031745910645 seconds + 0: Time to load utils op: 0.42539238929748535 seconds + 0: Time to load utils op: 0.4241955280303955 seconds +29: Time to load utils op: 0.3310227394104004 seconds +18: Time to load utils op: 0.0038771629333496094 seconds +18: Time to load utils op: 0.004416704177856445 secondsTime to load utils op: 0.004410505294799805 seconds +18: +18: Time to load utils op: 0.004395008087158203 seconds + 0: Time to load utils op: 0.0029320716857910156 seconds + 0: [2023-05-10 12:55:21,985] [INFO] [utils.py:827:see_memory_usage] end initialize_optimizer + 0: [2023-05-10 12:55:21,986] [INFO] [utils.py:828:see_memory_usage] MA 7.99 GB Max_MA 7.99 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:21,986] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.67 GB, percent = 8.1% + 0: Time to load utils op: 0.00040650367736816406 seconds + 0: Time to load utils op: 0.00037741661071777344 seconds + 0: Time to load utils op: 0.0004291534423828125 seconds +22: Time to load utils op: 0.0049474239349365234 secondsTime to load utils op: 0.00493621826171875 seconds +22: +22: Time to load utils op: 0.0048139095306396484 seconds +22: Time to load utils op: 0.004759550094604492 seconds +11: Time to load utils op: 0.005495309829711914 seconds +11: Time to load utils op: 0.005421638488769531 secondsTime to load utils op: 0.0058155059814453125 seconds +11: +11: Time to load utils op: 0.005858182907104492 seconds + 9: Time to load utils op: 0.004332780838012695 seconds + 9: Time to load utils op: 0.0036306381225585938 secondsTime to load utils op: 0.0038976669311523438 seconds + 9: + 9: Time to load utils op: 0.004007577896118164 seconds + 0: [2023-05-10 12:55:22,110] [INFO] [utils.py:827:see_memory_usage] end bf16_optimizer + 0: [2023-05-10 12:55:22,111] [INFO] [utils.py:828:see_memory_usage] MA 7.99 GB Max_MA 7.99 GB CA 10.63 GB Max_CA 11 GB + 0: [2023-05-10 12:55:22,111] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.63 GB, percent = 8.1% + 0: [2023-05-10 12:55:22,111] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Final Optimizer = FusedAdam + 0: [2023-05-10 12:55:22,111] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed using client LR scheduler + 0: [2023-05-10 12:55:22,111] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed LR Scheduler = + 0: [2023-05-10 12:55:22,111] [INFO] [logging.py:68:log_dist] [Rank 0] step=0, skipped=0, lr=[0.0002, 0.0002, 0.0002], mom=[(0.9, 0.999), (0.9, 0.999), (0.9, 0.999)] + 0: [2023-05-10 12:55:22,112] [INFO] [config.py:1007:print] DeepSpeedEngine configuration: + 0: [2023-05-10 12:55:22,112] [INFO] [config.py:1011:print] activation_checkpointing_config { + 0: "partition_activations": false, + 0: "contiguous_memory_optimization": false, + 0: "cpu_checkpointing": false, + 0: "number_checkpoints": null, + 0: "synchronize_checkpoint_boundary": false, + 0: "profile": false + 0: } + 0: [2023-05-10 12:55:22,112] [INFO] [config.py:1011:print] aio_config ................... {'block_size': 1048576, 'queue_depth': 8, 'thread_count': 1, 'single_submit': False, 'overlap_events': True} + 0: [2023-05-10 12:55:22,112] [INFO] [config.py:1011:print] amp_enabled .................. False + 0: [2023-05-10 12:55:22,112] [INFO] [config.py:1011:print] amp_params ................... False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] autotuning_config ............ { + 0: "enabled": false, + 0: "start_step": null, + 0: "end_step": null, + 0: "metric_path": null, + 0: "arg_mappings": null, + 0: "metric": "throughput", + 0: "model_info": null, + 0: "results_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_results", + 0: "exps_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_exps", + 0: "overwrite": true, + 0: "fast": true, + 0: "start_profile_step": 3, + 0: "end_profile_step": 5, + 0: "tuner_type": "gridsearch", + 0: "tuner_early_stopping": 5, + 0: "tuner_num_trials": 50, + 0: "model_info_path": null, + 0: "mp_size": 1, + 0: "max_train_batch_size": null, + 0: "min_train_batch_size": 1, + 0: "max_train_micro_batch_size_per_gpu": 1.024000e+03, + 0: "min_train_micro_batch_size_per_gpu": 1, + 0: "num_tuning_micro_batch_sizes": 3 + 0: } + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] bfloat16_enabled ............. True + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] checkpoint_parallel_write_pipeline False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] checkpoint_tag_validation_enabled True + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] checkpoint_tag_validation_fail False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] comms_config ................. + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] communication_data_type ...... None + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] compression_config ........... {'weight_quantization': {'shared_parameters': {'enabled': False, 'quantizer_kernel': False, 'schedule_offset': 0, 'quantize_groups': 1, 'quantize_verbose': False, 'quantization_type': 'symmetric', 'quantize_weight_in_forward': False, 'rounding': 'nearest', 'fp16_mixed_quantize': False, 'quantize_change_ratio': 0.001}, 'different_groups': {}}, 'activation_quantization': {'shared_parameters': {'enabled': False, 'quantization_type': 'symmetric', 'range_calibration': 'dynamic', 'schedule_offset': 1000}, 'different_groups': {}}, 'sparse_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'row_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'head_pruning': {'shared_parameters': {'enabled': False, 'method': 'topk', 'schedule_offset': 1000}, 'different_groups': {}}, 'channel_pruning': {'shared_pa + 0: rameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'layer_reduction': {'enabled': False}} + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] curriculum_enabled ........... False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] curriculum_params ............ False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] dataloader_drop_last ......... False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] disable_allgather ............ False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] dump_state ................... False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] dynamic_loss_scale_args ...... None + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] eigenvalue_enabled ........... False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] eigenvalue_gas_boundary_resolution 1 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] eigenvalue_layer_name ........ bert.encoder.layer + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] eigenvalue_layer_num ......... 0 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] eigenvalue_max_iter .......... 100 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] eigenvalue_stability ......... 1e-06 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] eigenvalue_tol ............... 0.01 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] eigenvalue_verbose ........... False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] elasticity_enabled ........... False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] flops_profiler_config ........ { + 0: "enabled": false, + 0: "profile_step": 1, + 0: "module_depth": -1, + 0: "top_modules": 1, + 0: "detailed": true, + 0: "output_file": null + 0: } + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] fp16_auto_cast ............... None + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] fp16_enabled ................. False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] fp16_master_weights_and_gradients False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] global_rank .................. 0 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] gradient_accumulation_steps .. 4 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] gradient_clipping ............ 1.0 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] gradient_predivide_factor .... 1.0 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] initial_dynamic_scale ........ 1 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] load_universal_checkpoint .... False + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] loss_scale ................... 1.0 + 0: [2023-05-10 12:55:22,113] [INFO] [config.py:1011:print] memory_breakdown ............. False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] monitor_config ............... + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] nebula_config ................ { + 0: "enabled": false, + 0: "persistent_storage_path": null, + 0: "persistent_time_interval": 100, + 0: "num_of_version_in_retention": 2, + 0: "enable_nebula_load": true, + 0: "load_path": null + 0: } + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] optimizer_legacy_fusion ...... False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] optimizer_name ............... None + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] optimizer_params ............. None + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] pipeline ..................... {'stages': 'auto', 'partition': 'best', 'seed_layers': False, 'activation_checkpoint_interval': 0} + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] pld_enabled .................. False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] pld_params ................... False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] prescale_gradients ........... False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] scheduler_name ............... None + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] scheduler_params ............. None + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] sparse_attention ............. None + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] sparse_gradients_enabled ..... False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] steps_per_print .............. 2000 + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] train_batch_size ............. 1024 + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] train_micro_batch_size_per_gpu 2 + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] use_node_local_storage ....... False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] wall_clock_breakdown ......... False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] world_size ................... 128 + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] zero_allow_untested_optimizer False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] zero_config .................. stage=0 contiguous_gradients=True reduce_scatter=True reduce_bucket_size=500000000 allgather_partitions=True allgather_bucket_size=500000000 overlap_comm=False load_from_fp32_weights=True elastic_checkpoint=False offload_param=None offload_optimizer=None sub_group_size=1000000000 cpu_offload_param=None cpu_offload_use_pin_memory=None cpu_offload=None prefetch_bucket_size=50000000 param_persistence_threshold=100000 model_persistence_threshold=9223372036854775807 max_live_parameters=1000000000 max_reuse_distance=1000000000 gather_16bit_weights_on_model_save=False stage3_gather_fp16_weights_on_model_save=False ignore_unused_parameters=True legacy_stage1=False round_robin_gradients=False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] zero_enabled ................. False + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:1011:print] zero_optimization_stage ...... 0 + 0: [2023-05-10 12:55:22,114] [INFO] [config.py:996:print_user_config] json = { + 0: "train_micro_batch_size_per_gpu": 2, + 0: "train_batch_size": 1.024000e+03, + 0: "gradient_clipping": 1.0, + 0: "zero_optimization": { + 0: "stage": 0 + 0: }, + 0: "bf16": { + 0: "enabled": true + 0: }, + 0: "steps_per_print": 2.000000e+03, + 0: "wall_clock_breakdown": false + 0: } + 0: Time to load utils op: 0.000438690185546875 seconds + 0: [2023-05-10 12:55:22,115] [INFO] [engine.py:87:__init__] CONFIG: micro_batches=4 micro_batch_size=2 + 0: [2023-05-10 12:55:22,137] [INFO] [engine.py:145:__init__] RANK=1 STAGE=0 LAYERS=41 [0, 41) STAGE_PARAMS=1407562240 (1407.562M) TOTAL_PARAMS=2815124480 (2815.124M) UNIQUE_PARAMS=2815124480 (2815.124M) + 0: [2023-05-10 12:55:22,138] [INFO] [engine.py:145:__init__] RANK=0 STAGE=0 LAYERS=41 [0, 41) STAGE_PARAMS=1407562240 (1407.562M) TOTAL_PARAMS=2815124480 (2815.124M) UNIQUE_PARAMS=2815124480 (2815.124M) +31: Time to load utils op: 0.0066623687744140625 seconds +31: Time to load utils op: 0.002371549606323242 seconds +31: Time to load utils op: 0.0004734992980957031 seconds +31: Time to load utils op: 0.0004203319549560547 seconds + 1: Time to load utils op: 0.0037431716918945312 secondsTime to load utils op: 0.0037496089935302734 seconds + 1: + 1: Time to load utils op: 0.0005588531494140625 seconds +26: Time to load utils op: 0.004046916961669922 seconds +26: Time to load utils op: 0.00034999847412109375 seconds + 2: Time to load utils op: 0.0039637088775634766 secondsTime to load utils op: 0.00396728515625 seconds + 2: Time to load utils op: 0.003949642181396484 seconds + 2: +14: Time to load utils op: 0.003612995147705078 seconds + 1: Time to load utils op: 0.0003991127014160156 seconds + 2: Time to load utils op: 0.000476837158203125 seconds +29: Time to load utils op: 0.006644487380981445 seconds + 7: Time to load utils op: 0.0038776397705078125 seconds +14: Time to load utils op: 0.00043129920959472656 secondsTime to load utils op: 0.0004754066467285156 seconds +14: +29: Time to load utils op: 0.003953456878662109 secondsTime to load utils op: 0.003983020782470703 seconds +29: +29: Time to load utils op: 0.00041222572326660156 seconds +21: Time to load utils op: 0.00638270378112793 seconds + 7: Time to load utils op: 0.0005118846893310547 secondsTime to load utils op: 0.00046753883361816406 seconds + 7: +26: Time to load utils op: 0.0004811286926269531 seconds +26: Time to load utils op: 0.0004639625549316406 seconds +14: Time to load utils op: 0.0005307197570800781 seconds +19: Time to load utils op: 0.004081249237060547 seconds + 5: Time to load utils op: 0.004158496856689453 seconds +30: Time to load utils op: 0.006590604782104492 seconds +19: Time to load utils op: 0.0003604888916015625 seconds + 5: Time to load utils op: 0.0004744529724121094 seconds +30: Time to load utils op: 0.00039649009704589844 seconds +28: Time to load utils op: 0.0037031173706054688 seconds +21: Time to load utils op: 0.00044226646423339844 seconds + 7: Time to load utils op: 0.0005154609680175781 seconds +28: Time to load utils op: 0.0004725456237792969 seconds +12: Time to load utils op: 0.003931760787963867 seconds +21: Time to load utils op: 0.0004925727844238281 seconds +30: Time to load utils op: 0.0004048347473144531 seconds + 4: Time to load utils op: 0.003997087478637695 seconds +28: Time to load utils op: 0.00043463706970214844 seconds +20: Time to load utils op: 0.003806591033935547 seconds +12: Time to load utils op: 0.0004723072052001953 seconds +12: Time to load utils op: 0.00047469139099121094 seconds + 4: Time to load utils op: 0.0040395259857177734 seconds + 5: Time to load utils op: 0.00036406517028808594 seconds +20: Time to load utils op: 0.00048041343688964844 seconds + 3: Time to load utils op: 0.003889799118041992 seconds +10: Time to load utils op: 0.004094362258911133 seconds +21: Time to load utils op: 0.00042891502380371094 seconds +19: Time to load utils op: 0.00043392181396484375 seconds +28: Time to load utils op: 0.00041604042053222656 seconds +30: Time to load utils op: 0.0004069805145263672 seconds +10: Time to load utils op: 0.0003674030303955078 seconds + 4: Time to load utils op: 0.00047969818115234375 secondsTime to load utils op: 0.0004487037658691406 seconds + 4: + 3: Time to load utils op: 0.00047397613525390625 seconds +10: Time to load utils op: 0.0003616809844970703 seconds +23: Time to load utils op: 0.006626129150390625 seconds +23: Time to load utils op: 0.0004897117614746094 seconds +19: Time to load utils op: 0.0004031658172607422 seconds + 5: Time to load utils op: 0.0004334449768066406 seconds + 8: Time to load utils op: 0.003789663314819336 seconds +23: Time to load utils op: 0.0004134178161621094 seconds +23: Time to load utils op: 0.0004818439483642578 seconds +17: Time to load utils op: 0.006560087203979492 seconds +13: Time to load utils op: 0.0038671493530273438 seconds + 6: Time to load utils op: 0.004065036773681641 secondsTime to load utils op: 0.003954648971557617 seconds + 6: + 3: Time to load utils op: 0.0004038810729980469 seconds +20: Time to load utils op: 0.0004591941833496094 secondsTime to load utils op: 0.000461578369140625 seconds +20: +17: Time to load utils op: 0.003854036331176758 seconds + 6: Time to load utils op: 0.00047588348388671875 seconds +16: Time to load utils op: 0.0038640499114990234 seconds +10: Time to load utils op: 0.00036525726318359375 seconds +24: Time to load utils op: 0.0064814090728759766 secondsTime to load utils op: 0.006481647491455078 seconds +24: +24: Time to load utils op: 0.006426572799682617 seconds +17: Time to load utils op: 0.0004475116729736328 seconds +13: Time to load utils op: 0.0004742145538330078 seconds + 6: Time to load utils op: 0.000476837158203125 seconds +27: Time to load utils op: 0.004036903381347656 seconds +27: Time to load utils op: 0.0041162967681884766 seconds + 8: Time to load utils op: 0.0004928112030029297 seconds +24: Time to load utils op: 0.00657963752746582 seconds +12: Time to load utils op: 0.00034928321838378906 seconds +13: Time to load utils op: 0.0004634857177734375 seconds +25: Time to load utils op: 0.006459712982177734 seconds +25: Time to load utils op: 0.006404876708984375 seconds + 3: Time to load utils op: 0.0004112720489501953 seconds + 8: Time to load utils op: 0.0003268718719482422 seconds +25: Time to load utils op: 0.00040435791015625 seconds +16: Time to load utils op: 0.000476837158203125 seconds +13: Time to load utils op: 0.0003895759582519531 seconds +16: Time to load utils op: 0.00049591064453125 seconds +17: Time to load utils op: 0.0004184246063232422 seconds +25: Time to load utils op: 0.00040793418884277344 seconds +27: Time to load utils op: 0.0004911422729492188 seconds +16: Time to load utils op: 0.00044727325439453125 seconds +27: Time to load utils op: 0.0004413127899169922 seconds + 8: Time to load utils op: 0.00043511390686035156 seconds +28: [2023-05-10 12:55:25,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +28: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 9: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 9: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +28: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +28: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +28: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 9: [2023-05-10 12:55:25,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +15: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +26: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +21: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +26: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +27: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +27: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 7: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +26: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +27: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:55:25,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +30: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +26: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +27: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +21: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +15: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 1: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +24: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +21: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +25: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +30: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +21: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +30: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 0: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +15: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +30: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 1: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +15: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 1: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +25: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 1: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +25: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 7: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +11: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 3: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +25: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +24: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +25: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +23: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 0: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +11: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:55:25,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +25: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +11: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 7: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +23: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +24: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 0: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +11: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +11: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 0: [2023-05-10 12:55:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +23: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 7: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 8: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +29: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +14: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 5: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 3: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +12: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 5: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 5: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 8: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +14: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 5: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 8: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 3: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +29: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:55:25,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +14: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +29: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +14: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +12: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +19: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:55:25,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +12: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +22: [2023-05-10 12:55:25,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +10: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +19: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +19: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +22: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +22: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +22: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +20: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +16: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +19: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +16: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +10: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +17: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +17: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +18: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +16: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 2: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 6: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 6: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... + 4: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +16: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +20: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +10: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +17: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +10: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +17: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +20: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... + 4: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +20: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +18: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +31: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +18: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 4: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 4: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. + 2: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 6: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +31: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. + 2: [2023-05-10 12:55:25,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +18: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +31: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt... +13: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt... +13: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_00_model_states.pt. +13: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/mp_rank_01_model_states.pt. +13: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +15: [2023-05-10 12:55:25,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 2: [2023-05-10 12:55:25,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +24: [2023-05-10 12:55:25,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +23: [2023-05-10 12:55:25,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +28: [2023-05-10 12:55:25,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +28: [2023-05-10 12:55:25,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +24: [2023-05-10 12:55:25,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +24: [2023-05-10 12:55:25,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 5: [2023-05-10 12:55:25,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 5: [2023-05-10 12:55:25,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +22: [2023-05-10 12:55:25,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 2: [2023-05-10 12:55:25,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +28: [2023-05-10 12:55:25,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:25,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:25,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +15: [2023-05-10 12:55:25,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:25,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:25,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:25,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:25,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:55:25,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:55:25,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 7: [2023-05-10 12:55:25,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +15: [2023-05-10 12:55:25,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:25,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:55:25,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:55:25,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:55:25,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +19: [2023-05-10 12:55:25,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +19: [2023-05-10 12:55:25,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +16: [2023-05-10 12:55:25,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +30: [2023-05-10 12:55:25,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:55:25,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:55:25,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:55:25,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:55:25,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 9: [2023-05-10 12:55:25,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +23: [2023-05-10 12:55:25,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 9: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +23: [2023-05-10 12:55:25,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +16: [2023-05-10 12:55:25,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:25,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:25,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +22: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +16: [2023-05-10 12:55:25,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:25,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +23: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +22: [2023-05-10 12:55:25,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:25,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +30: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +10: [2023-05-10 12:55:25,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +30: [2023-05-10 12:55:25,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:25,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +24: [2023-05-10 12:55:25,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:25,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:25,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:25,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +24: [2023-05-10 12:55:25,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:25,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:25,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +25: [2023-05-10 12:55:25,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:55:25,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +31: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 0: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +25: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 0: [2023-05-10 12:55:25,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:25,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:25,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 7: [2023-05-10 12:55:25,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +17: [2023-05-10 12:55:25,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 4: [2023-05-10 12:55:25,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +31: [2023-05-10 12:55:25,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:55:25,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:25,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +19: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +31: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:25,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +25: [2023-05-10 12:55:25,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:25,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:25,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:25,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:25,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:25,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:25,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:25,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:25,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 9: [2023-05-10 12:55:25,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:55:25,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +13: [2023-05-10 12:55:25,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:25,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +17: [2023-05-10 12:55:25,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:25,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:25,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:25,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:55:25,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:55:25,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:55:25,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:25,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:25,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +11: [2023-05-10 12:55:25,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 4: [2023-05-10 12:55:25,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:25,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +10: [2023-05-10 12:55:25,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +17: [2023-05-10 12:55:25,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:25,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +10: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +18: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +18: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +14: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:55:25,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:55:25,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +14: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 3: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +20: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +20: [2023-05-10 12:55:25,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +26: [2023-05-10 12:55:25,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:55:25,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +12: [2023-05-10 12:55:25,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +12: [2023-05-10 12:55:25,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +29: [2023-05-10 12:55:25,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:25,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +26: [2023-05-10 12:55:25,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +29: [2023-05-10 12:55:25,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:25,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +29: [2023-05-10 12:55:25,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:55:25,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +21: [2023-05-10 12:55:25,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +27: [2023-05-10 12:55:25,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +21: [2023-05-10 12:55:25,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 6: [2023-05-10 12:55:25,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... +27: [2023-05-10 12:55:25,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +26: [2023-05-10 12:55:25,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:25,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:25,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:55:25,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 6: [2023-05-10 12:55:25,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:25,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:55:25,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt... + 8: [2023-05-10 12:55:25,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt... +13: [2023-05-10 12:55:25,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 1: [2023-05-10 12:55:25,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:25,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:25,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +18: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:25,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:25,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:25,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +13: [2023-05-10 12:55:25,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:25,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:25,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:25,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:25,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 3: [2023-05-10 12:55:25,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:25,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:25,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:25,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:25,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +27: [2023-05-10 12:55:25,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +11: [2023-05-10 12:55:25,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:25,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +21: [2023-05-10 12:55:25,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +14: [2023-05-10 12:55:25,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:25,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:25,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +12: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. + 8: [2023-05-10 12:55:25,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_00-model_states.pt. +20: [2023-05-10 12:55:25,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:25,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:25,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:25,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:25,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:25,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:55:26,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:55:26,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +23: [2023-05-10 12:55:26,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:55:26,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:55:26,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +15: [2023-05-10 12:55:26,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +28: [2023-05-10 12:55:26,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:26,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:55:26,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:55:26,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 0: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +23: [2023-05-10 12:55:26,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:26,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:55:26,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +16: [2023-05-10 12:55:26,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +16: [2023-05-10 12:55:26,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +16: [2023-05-10 12:55:26,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +28: [2023-05-10 12:55:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +16: [2023-05-10 12:55:26,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:55:26,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:55:26,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 1: [2023-05-10 12:55:26,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:55:26,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:55:26,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:55:26,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:55:26,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +15: [2023-05-10 12:55:26,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:55:26,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:26,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:55:26,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:26,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +14: [2023-05-10 12:55:26,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +20: [2023-05-10 12:55:26,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +24: [2023-05-10 12:55:26,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:55:26,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:55:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:55:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +15: [2023-05-10 12:55:26,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:26,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:26,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:55:26,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +15: [2023-05-10 12:55:26,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 5: [2023-05-10 12:55:26,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 5: [2023-05-10 12:55:26,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:55:26,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:26,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:55:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:55:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +22: [2023-05-10 12:55:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +24: [2023-05-10 12:55:26,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +24: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +12: [2023-05-10 12:55:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:55:26,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:55:26,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +18: [2023-05-10 12:55:26,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:55:26,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:55:26,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +11: [2023-05-10 12:55:26,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +21: [2023-05-10 12:55:26,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +24: [2023-05-10 12:55:26,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +25: [2023-05-10 12:55:26,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +11: [2023-05-10 12:55:26,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +22: [2023-05-10 12:55:26,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:55:26,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:55:26,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +22: [2023-05-10 12:55:26,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +22: [2023-05-10 12:55:26,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +25: [2023-05-10 12:55:26,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +30: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +30: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:26,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +30: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +27: [2023-05-10 12:55:26,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +25: [2023-05-10 12:55:26,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:55:26,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:55:26,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +25: [2023-05-10 12:55:26,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:55:26,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:55:26,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:55:26,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:26,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:26,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +26: [2023-05-10 12:55:26,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +18: [2023-05-10 12:55:26,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +11: [2023-05-10 12:55:26,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:26,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:26,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:26,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +14: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:26,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:26,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +14: [2023-05-10 12:55:26,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:55:26,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:26,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:55:26,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +27: [2023-05-10 12:55:26,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +11: [2023-05-10 12:55:26,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +18: [2023-05-10 12:55:26,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +18: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 1: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:55:26,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:55:26,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +26: [2023-05-10 12:55:26,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +26: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +20: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +20: [2023-05-10 12:55:26,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:26,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +30: [2023-05-10 12:55:26,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +30: [2023-05-10 12:55:26,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +26: [2023-05-10 12:55:26,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +19: [2023-05-10 12:55:26,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +29: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +29: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +31: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +27: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +27: [2023-05-10 12:55:26,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +12: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +21: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +14: [2023-05-10 12:55:26,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +10: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:55:26,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 7: [2023-05-10 12:55:26,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 8: [2023-05-10 12:55:26,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +21: [2023-05-10 12:55:26,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:26,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:26,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:55:26,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +13: [2023-05-10 12:55:26,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +21: [2023-05-10 12:55:26,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +19: [2023-05-10 12:55:26,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +20: [2023-05-10 12:55:26,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +12: [2023-05-10 12:55:26,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +29: [2023-05-10 12:55:26,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +10: [2023-05-10 12:55:26,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:55:26,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:26,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +12: [2023-05-10 12:55:26,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:26,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +19: [2023-05-10 12:55:26,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +31: [2023-05-10 12:55:26,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:26,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +31: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +31: [2023-05-10 12:55:26,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +19: [2023-05-10 12:55:26,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +10: [2023-05-10 12:55:26,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +28: [2023-05-10 12:55:26,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +28: [2023-05-10 12:55:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +28: [2023-05-10 12:55:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:55:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +10: [2023-05-10 12:55:26,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +17: [2023-05-10 12:55:26,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. +29: [2023-05-10 12:55:26,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_01-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +28: [2023-05-10 12:55:26,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:26,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:55:26,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:55:26,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:55:26,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 9: [2023-05-10 12:55:26,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +23: [2023-05-10 12:55:26,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +17: [2023-05-10 12:55:26,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt... +13: [2023-05-10 12:55:26,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +23: [2023-05-10 12:55:26,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:26,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:26,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:26,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +13: [2023-05-10 12:55:26,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +13: [2023-05-10 12:55:26,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. +17: [2023-05-10 12:55:26,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... +17: [2023-05-10 12:55:26,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:55:26,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:55:26,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:55:26,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:55:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:26,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:26,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:55:26,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:55:26,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:55:26,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:55:26,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +28: [2023-05-10 12:55:26,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +28: [2023-05-10 12:55:26,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:55:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:55:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:55:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +30: [2023-05-10 12:55:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +11: [2023-05-10 12:55:26,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:26,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +22: [2023-05-10 12:55:26,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +18: [2023-05-10 12:55:26,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:55:26,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +22: [2023-05-10 12:55:26,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:26,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:26,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +24: [2023-05-10 12:55:26,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:55:26,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:55:26,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +24: [2023-05-10 12:55:26,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +22: [2023-05-10 12:55:26,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +15: [2023-05-10 12:55:26,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +30: [2023-05-10 12:55:26,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +30: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +30: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +30: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +30: [2023-05-10 12:55:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +18: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +18: [2023-05-10 12:55:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +18: [2023-05-10 12:55:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +15: [2023-05-10 12:55:26,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:26,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +15: [2023-05-10 12:55:26,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:55:26,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:55:26,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +16: [2023-05-10 12:55:26,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:55:26,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:55:26,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:55:26,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +16: [2023-05-10 12:55:26,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +30: [2023-05-10 12:55:26,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +30: [2023-05-10 12:55:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:26,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:26,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:26,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +26: [2023-05-10 12:55:26,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:55:26,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:55:26,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:55:26,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:55:26,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +26: [2023-05-10 12:55:26,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +25: [2023-05-10 12:55:26,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:26,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:55:26,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:55:26,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:55:26,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 5: [2023-05-10 12:55:26,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +26: [2023-05-10 12:55:26,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +26: [2023-05-10 12:55:26,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:55:26,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:26,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:26,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:26,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:26,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:26,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:26,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:26,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:55:26,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 3: [2023-05-10 12:55:26,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:26,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:55:26,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:55:26,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +31: [2023-05-10 12:55:26,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 0: [2023-05-10 12:55:26,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 0: [2023-05-10 12:55:26,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:26,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:26,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:26,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:26,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +20: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +27: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +21: [2023-05-10 12:55:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +23: [2023-05-10 12:55:26,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:26,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +23: [2023-05-10 12:55:26,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:26,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:26,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +27: [2023-05-10 12:55:26,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:26,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:26,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:55:26,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:26,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:55:26,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:55:26,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +14: [2023-05-10 12:55:26,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:26,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:26,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:26,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:26,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:55:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:55:26,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:26,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +27: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 1: [2023-05-10 12:55:26,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:55:26,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:55:26,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:55:26,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +27: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +12: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +11: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +29: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 1: [2023-05-10 12:55:26,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:26,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:26,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:55:26,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:26,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +10: [2023-05-10 12:55:26,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 8: [2023-05-10 12:55:26,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:55:26,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 9: [2023-05-10 12:55:26,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:26,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:26,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:26,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +21: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +21: [2023-05-10 12:55:26,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +17: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +13: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. +19: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_03-model_01-model_states.pt. + 6: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +21: [2023-05-10 12:55:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:26,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 3: [2023-05-10 12:55:26,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:26,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:55:26,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:55:26,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +19: [2023-05-10 12:55:26,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:26,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +29: [2023-05-10 12:55:26,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:55:26,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +12: [2023-05-10 12:55:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 1: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 9: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +29: [2023-05-10 12:55:26,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +20: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +20: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +11: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +13: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +17: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:26,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:26,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +14: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +14: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:55:26,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +10: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +12: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:26,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +12: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +25: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:26,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt... +31: [2023-05-10 12:55:26,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +29: [2023-05-10 12:55:26,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:26,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:26,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:26,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:26,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +31: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +28: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:26,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:26,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 7: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:26,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 7: [2023-05-10 12:55:26,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:26,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +25: [2023-05-10 12:55:26,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:26,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 2: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +19: [2023-05-10 12:55:26,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +25: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +24: [2023-05-10 12:55:26,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +22: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:26,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:26,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +19: [2023-05-10 12:55:26,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:26,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:55:26,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:26,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +31: [2023-05-10 12:55:26,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:26,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +11: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +16: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +16: [2023-05-10 12:55:26,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:26,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +11: [2023-05-10 12:55:26,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:55:26,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:55:26,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +10: [2023-05-10 12:55:26,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:55:26,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +22: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:26,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +24: [2023-05-10 12:55:26,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +20: [2023-05-10 12:55:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +14: [2023-05-10 12:55:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +15: [2023-05-10 12:55:26,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +15: [2023-05-10 12:55:26,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:26,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +15: [2023-05-10 12:55:26,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:55:26,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +23: [2023-05-10 12:55:26,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +13: [2023-05-10 12:55:26,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +23: [2023-05-10 12:55:26,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:55:26,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +10: [2023-05-10 12:55:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +13: [2023-05-10 12:55:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_00-model_states.pt. +17: [2023-05-10 12:55:26,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:55:26,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:55:26,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +24: [2023-05-10 12:55:26,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:26,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... +17: [2023-05-10 12:55:26,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:26,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:26,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:26,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:26,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:26,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:26,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:26,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:26,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:55:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:55:26,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:26,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:26,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:26,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:26,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:26,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:26,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:26,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:26,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:26,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:26,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:26,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:55:26,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +22: [2023-05-10 12:55:26,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:26,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:26,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +22: [2023-05-10 12:55:26,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:26,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:26,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:26,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:26,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:26,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:26,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:26,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:26,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:26,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:55:26,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +28: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:26,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:26,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:26,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:26,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:26,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:26,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:26,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:26,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:26,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:26,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:26,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:55:26,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +15: [2023-05-10 12:55:26,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:26,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:26,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:26,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:26,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:26,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:26,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:26,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:55:26,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:26,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:26,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:26,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:26,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:26,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:26,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:26,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +25: [2023-05-10 12:55:26,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +25: [2023-05-10 12:55:26,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:26,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:26,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:26,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:55:26,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:55:26,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:55:26,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:26,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:26,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +16: [2023-05-10 12:55:26,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +26: [2023-05-10 12:55:26,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:26,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:26,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:55:26,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:26,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:26,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:26,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +25: [2023-05-10 12:55:26,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +25: [2023-05-10 12:55:26,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:26,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:26,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:55:26,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:26,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +16: [2023-05-10 12:55:26,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +16: [2023-05-10 12:55:26,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:55:26,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +26: [2023-05-10 12:55:26,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:26,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:26,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:55:26,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:55:26,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +30: [2023-05-10 12:55:26,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:55:26,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:26,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +26: [2023-05-10 12:55:26,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +30: [2023-05-10 12:55:26,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:26,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:26,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:26,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:26,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +26: [2023-05-10 12:55:26,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:26,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:26,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:26,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:26,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:55:26,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +30: [2023-05-10 12:55:26,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:26,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:26,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 7: [2023-05-10 12:55:26,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:55:26,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:26,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:26,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +30: [2023-05-10 12:55:26,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:26,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:26,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:26,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:26,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:26,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:26,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:26,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:26,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:26,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:26,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:26,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:26,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:26,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:26,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:26,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:26,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:26,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:26,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +31: [2023-05-10 12:55:27,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:55:27,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:55:27,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:55:27,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:55:27,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:55:27,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +23: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +29: [2023-05-10 12:55:27,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:55:27,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:27,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:55:27,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +31: [2023-05-10 12:55:27,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:27,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +27: [2023-05-10 12:55:27,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +24: [2023-05-10 12:55:27,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +21: [2023-05-10 12:55:27,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:55:27,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +24: [2023-05-10 12:55:27,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:55:27,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +31: [2023-05-10 12:55:27,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:55:27,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:55:27,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +12: [2023-05-10 12:55:27,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +31: [2023-05-10 12:55:27,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +27: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +24: [2023-05-10 12:55:27,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:55:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +24: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:27,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:55:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +18: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +20: [2023-05-10 12:55:27,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +19: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +18: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +18: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +18: [2023-05-10 12:55:27,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +15: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +15: [2023-05-10 12:55:27,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +27: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:55:27,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +27: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +20: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:55:27,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +29: [2023-05-10 12:55:27,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +12: [2023-05-10 12:55:27,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:55:27,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +12: [2023-05-10 12:55:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:55:27,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +29: [2023-05-10 12:55:27,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +20: [2023-05-10 12:55:27,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +12: [2023-05-10 12:55:27,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:55:27,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +14: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +23: [2023-05-10 12:55:27,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +29: [2023-05-10 12:55:27,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +23: [2023-05-10 12:55:27,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +20: [2023-05-10 12:55:27,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:55:27,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +14: [2023-05-10 12:55:27,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:55:27,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +14: [2023-05-10 12:55:27,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:55:27,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +19: [2023-05-10 12:55:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +19: [2023-05-10 12:55:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:55:27,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:55:27,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +14: [2023-05-10 12:55:27,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +10: [2023-05-10 12:55:27,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +23: [2023-05-10 12:55:27,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +11: [2023-05-10 12:55:27,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +23: [2023-05-10 12:55:27,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +23: [2023-05-10 12:55:27,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +13: [2023-05-10 12:55:27,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +28: [2023-05-10 12:55:27,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +17: [2023-05-10 12:55:27,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +13: [2023-05-10 12:55:27,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +13: [2023-05-10 12:55:27,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +13: [2023-05-10 12:55:27,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:55:27,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +21: [2023-05-10 12:55:27,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:27,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +28: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +19: [2023-05-10 12:55:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +28: [2023-05-10 12:55:27,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +17: [2023-05-10 12:55:27,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +19: [2023-05-10 12:55:27,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +19: [2023-05-10 12:55:27,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +10: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +10: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +10: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:55:27,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +21: [2023-05-10 12:55:27,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +22: [2023-05-10 12:55:27,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +26: [2023-05-10 12:55:27,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +17: [2023-05-10 12:55:27,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +17: [2023-05-10 12:55:27,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +21: [2023-05-10 12:55:27,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +22: [2023-05-10 12:55:27,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +21: [2023-05-10 12:55:27,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:55:27,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +11: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +11: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_04-model_01-model_states.pt. +25: [2023-05-10 12:55:27,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:55:27,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:55:27,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:55:27,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt... +16: [2023-05-10 12:55:27,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. +11: [2023-05-10 12:55:27,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:55:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:55:27,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:55:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt... +25: [2023-05-10 12:55:27,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:55:27,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +25: [2023-05-10 12:55:27,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +27: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +16: [2023-05-10 12:55:27,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:55:27,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:55:27,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +16: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +22: [2023-05-10 12:55:27,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +25: [2023-05-10 12:55:27,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:27,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +28: [2023-05-10 12:55:27,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:55:27,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +28: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +31: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:55:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +25: [2023-05-10 12:55:27,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +20: [2023-05-10 12:55:27,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +25: [2023-05-10 12:55:27,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +31: [2023-05-10 12:55:27,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +27: [2023-05-10 12:55:27,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +31: [2023-05-10 12:55:27,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +16: [2023-05-10 12:55:27,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +28: [2023-05-10 12:55:27,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +16: [2023-05-10 12:55:27,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +27: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +28: [2023-05-10 12:55:27,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +22: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:55:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +31: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +24: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +24: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +24: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +24: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +26: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +24: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +21: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +21: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +15: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +15: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +12: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +15: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +15: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +30: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +29: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +12: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +20: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +30: [2023-05-10 12:55:27,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +10: [2023-05-10 12:55:27,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +26: [2023-05-10 12:55:27,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +12: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +15: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +29: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +18: [2023-05-10 12:55:27,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +24: [2023-05-10 12:55:27,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +30: [2023-05-10 12:55:27,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +26: [2023-05-10 12:55:27,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:55:27,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +14: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +29: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:55:27,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +20: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +30: [2023-05-10 12:55:27,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +12: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +18: [2023-05-10 12:55:27,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +29: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +23: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:55:27,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +10: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +20: [2023-05-10 12:55:27,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +18: [2023-05-10 12:55:27,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +18: [2023-05-10 12:55:27,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +10: [2023-05-10 12:55:27,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +10: [2023-05-10 12:55:27,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +14: [2023-05-10 12:55:27,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +14: [2023-05-10 12:55:27,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +14: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +11: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +13: [2023-05-10 12:55:27,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:55:27,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:55:27,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:55:27,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:55:27,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:55:27,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +19: [2023-05-10 12:55:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +19: [2023-05-10 12:55:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +10: [2023-05-10 12:55:27,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +11: [2023-05-10 12:55:27,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +13: [2023-05-10 12:55:27,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +11: [2023-05-10 12:55:27,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:55:27,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +17: [2023-05-10 12:55:27,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:55:27,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +19: [2023-05-10 12:55:27,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +10: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +11: [2023-05-10 12:55:27,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +10: [2023-05-10 12:55:27,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +19: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:55:27,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +17: [2023-05-10 12:55:27,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +13: [2023-05-10 12:55:27,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +21: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. +17: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:55:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +17: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_05-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +10: [2023-05-10 12:55:27,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +10: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +13: [2023-05-10 12:55:27,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +21: [2023-05-10 12:55:27,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt... +19: [2023-05-10 12:55:27,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +27: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +27: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +27: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +27: [2023-05-10 12:55:27,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +23: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. +21: [2023-05-10 12:55:27,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +21: [2023-05-10 12:55:27,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt... +23: [2023-05-10 12:55:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +16: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +16: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +16: [2023-05-10 12:55:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +16: [2023-05-10 12:55:27,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:55:27,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +24: [2023-05-10 12:55:27,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 3: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +29: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +29: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +29: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +29: [2023-05-10 12:55:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +12: [2023-05-10 12:55:27,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:55:27,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:27,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:27,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:27,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +30: [2023-05-10 12:55:27,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:55:27,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +15: [2023-05-10 12:55:27,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +25: [2023-05-10 12:55:27,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +14: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +14: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +14: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +18: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +28: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +31: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +20: [2023-05-10 12:55:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +16: [2023-05-10 12:55:27,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:27,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:27,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:55:27,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:55:27,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:27,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +31: [2023-05-10 12:55:27,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:27,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:27,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +11: [2023-05-10 12:55:27,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 6: [2023-05-10 12:55:27,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:55:27,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +10: [2023-05-10 12:55:27,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +17: [2023-05-10 12:55:27,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:55:27,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +19: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +21: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +26: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:55:27,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 9: [2023-05-10 12:55:27,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +13: [2023-05-10 12:55:27,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +26: [2023-05-10 12:55:27,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +26: [2023-05-10 12:55:27,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. + 5: [2023-05-10 12:55:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_06-model_01-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +22: [2023-05-10 12:55:27,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +26: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:55:27,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:55:27,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:55:27,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +13: [2023-05-10 12:55:27,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:55:27,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +13: [2023-05-10 12:55:27,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:27,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +28: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:55:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +28: [2023-05-10 12:55:27,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +21: [2023-05-10 12:55:27,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +23: [2023-05-10 12:55:27,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 1: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +28: [2023-05-10 12:55:27,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +29: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +25: [2023-05-10 12:55:27,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:27,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:27,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:27,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:27,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:27,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +27: [2023-05-10 12:55:27,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +29: [2023-05-10 12:55:27,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +29: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +11: [2023-05-10 12:55:27,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +11: [2023-05-10 12:55:27,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:55:27,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:27,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +23: [2023-05-10 12:55:27,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:55:27,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:27,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:27,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +16: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:55:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +20: [2023-05-10 12:55:27,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +25: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +23: [2023-05-10 12:55:27,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:27,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +27: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:27,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +31: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +25: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +31: [2023-05-10 12:55:27,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:55:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +16: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +16: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +31: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +16: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:55:27,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:55:27,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:27,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +11: [2023-05-10 12:55:27,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:27,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +20: [2023-05-10 12:55:27,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +25: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +25: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +10: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +31: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +31: [2023-05-10 12:55:27,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:55:27,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +16: [2023-05-10 12:55:27,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +16: [2023-05-10 12:55:27,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +25: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +16: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +30: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +17: [2023-05-10 12:55:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +17: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 6: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +18: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +18: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +18: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +14: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +12: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +20: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 9: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +19: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 5: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:55:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +10: [2023-05-10 12:55:27,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:27,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:27,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:27,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +15: [2023-05-10 12:55:27,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:27,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:27,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:27,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +24: [2023-05-10 12:55:27,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +24: [2023-05-10 12:55:27,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... +15: [2023-05-10 12:55:27,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +31: [2023-05-10 12:55:27,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:27,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +13: [2023-05-10 12:55:27,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +17: [2023-05-10 12:55:27,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:27,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... +15: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:27,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:27,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 9: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +14: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:27,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +24: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +19: [2023-05-10 12:55:27,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +30: [2023-05-10 12:55:27,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:27,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +22: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:27,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:27,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +21: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +12: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:27,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. +18: [2023-05-10 12:55:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:27,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:27,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:27,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:27,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:27,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:27,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:27,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +26: [2023-05-10 12:55:27,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:55:27,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:27,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 2: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:27,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:55:27,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 1: [2023-05-10 12:55:27,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:27,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:27,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:27,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +26: [2023-05-10 12:55:27,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:27,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:27,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:27,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:27,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:27,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:27,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:27,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:27,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:27,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:27,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:27,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:27,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:27,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 2: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +26: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +26: [2023-05-10 12:55:27,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 1: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +22: [2023-05-10 12:55:27,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 1: [2023-05-10 12:55:27,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +28: [2023-05-10 12:55:27,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 2: [2023-05-10 12:55:27,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:27,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:27,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 8: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +13: [2023-05-10 12:55:27,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:55:27,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +28: [2023-05-10 12:55:27,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:27,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:55:27,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:55:27,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +21: [2023-05-10 12:55:27,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 0: [2023-05-10 12:55:27,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 0: [2023-05-10 12:55:27,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:27,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:27,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:27,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 0: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 0: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:27,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +22: [2023-05-10 12:55:27,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:55:27,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +22: [2023-05-10 12:55:27,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +22: [2023-05-10 12:55:27,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:55:27,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:55:27,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:55:27,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +29: [2023-05-10 12:55:27,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:55:27,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:27,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:27,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 8: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 7: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 8: [2023-05-10 12:55:27,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:55:27,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:27,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +21: [2023-05-10 12:55:27,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +29: [2023-05-10 12:55:27,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:27,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:27,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:55:27,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:27,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +28: [2023-05-10 12:55:27,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +28: [2023-05-10 12:55:27,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +13: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:55:27,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +11: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +27: [2023-05-10 12:55:27,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:27,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:55:27,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +13: [2023-05-10 12:55:27,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +21: [2023-05-10 12:55:27,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:55:27,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +21: [2023-05-10 12:55:27,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:27,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:27,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:27,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:27,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +13: [2023-05-10 12:55:27,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:55:27,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:27,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:27,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +29: [2023-05-10 12:55:27,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:27,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:27,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 7: [2023-05-10 12:55:27,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:27,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 4: [2023-05-10 12:55:27,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 7: [2023-05-10 12:55:27,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 7: [2023-05-10 12:55:27,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:27,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:27,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +29: [2023-05-10 12:55:28,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +11: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +27: [2023-05-10 12:55:28,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:55:28,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +10: [2023-05-10 12:55:28,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +11: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +11: [2023-05-10 12:55:28,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +27: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +27: [2023-05-10 12:55:28,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +17: [2023-05-10 12:55:28,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +17: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:55:28,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:55:28,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +17: [2023-05-10 12:55:28,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:55:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +20: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +20: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +20: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +20: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +17: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +17: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +15: [2023-05-10 12:55:28,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +10: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +23: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +23: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +10: [2023-05-10 12:55:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +23: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +10: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +10: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +10: [2023-05-10 12:55:28,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:55:28,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 3: [2023-05-10 12:55:28,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:55:28,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:55:28,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +24: [2023-05-10 12:55:28,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +30: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:28,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:55:28,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:55:28,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +12: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +19: [2023-05-10 12:55:28,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +18: [2023-05-10 12:55:28,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +14: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +23: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +19: [2023-05-10 12:55:28,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_07-model_01-model_states.pt. +15: [2023-05-10 12:55:28,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +15: [2023-05-10 12:55:28,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +15: [2023-05-10 12:55:28,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +12: [2023-05-10 12:55:28,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:28,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +23: [2023-05-10 12:55:28,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +23: [2023-05-10 12:55:28,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:28,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +19: [2023-05-10 12:55:28,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +14: [2023-05-10 12:55:28,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +30: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:55:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +18: [2023-05-10 12:55:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt... +24: [2023-05-10 12:55:28,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:55:28,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +12: [2023-05-10 12:55:28,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +12: [2023-05-10 12:55:28,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +24: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +14: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +24: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +30: [2023-05-10 12:55:28,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +30: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +19: [2023-05-10 12:55:28,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +19: [2023-05-10 12:55:28,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +25: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +18: [2023-05-10 12:55:28,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_00-model_states.pt. +14: [2023-05-10 12:55:28,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:55:28,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... +18: [2023-05-10 12:55:28,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:55:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +16: [2023-05-10 12:55:28,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:55:28,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +16: [2023-05-10 12:55:28,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:55:28,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:55:28,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:55:28,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:55:28,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +31: [2023-05-10 12:55:28,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:55:28,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:28,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:28,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:55:28,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:55:28,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:28,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:28,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:55:28,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +22: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:28,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +25: [2023-05-10 12:55:28,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:28,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:55:28,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:55:28,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:28,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:28,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +22: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +25: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +28: [2023-05-10 12:55:28,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:55:28,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +28: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +22: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +22: [2023-05-10 12:55:28,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:28,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:28,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:28,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:28,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:28,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +23: [2023-05-10 12:55:28,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +23: [2023-05-10 12:55:28,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +23: [2023-05-10 12:55:28,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:28,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +31: [2023-05-10 12:55:28,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +31: [2023-05-10 12:55:28,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +31: [2023-05-10 12:55:28,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:55:28,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:28,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:28,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:28,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:28,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:55:28,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:28,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +23: [2023-05-10 12:55:28,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +23: [2023-05-10 12:55:28,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:55:28,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:55:28,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:28,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:28,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:55:28,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +31: [2023-05-10 12:55:28,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:28,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:28,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:28,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:28,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:28,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +22: [2023-05-10 12:55:28,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +22: [2023-05-10 12:55:28,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +22: [2023-05-10 12:55:28,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:55:28,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:55:28,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:28,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:28,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:28,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +28: [2023-05-10 12:55:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:28,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:28,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:28,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:28,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:55:28,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:28,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +20: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:28,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:55:28,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +28: [2023-05-10 12:55:28,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:28,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:28,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:28,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +25: [2023-05-10 12:55:28,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:28,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:55:28,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +28: [2023-05-10 12:55:28,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:28,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:28,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:28,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:28,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:28,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:28,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:28,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:28,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +27: [2023-05-10 12:55:28,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +27: [2023-05-10 12:55:28,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +27: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +27: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:55:28,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:28,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +31: [2023-05-10 12:55:28,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:28,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:28,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:28,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +29: [2023-05-10 12:55:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:28,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +31: [2023-05-10 12:55:28,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:28,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:28,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:28,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:28,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:28,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:28,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:28,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:28,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:28,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:28,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:55:28,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +29: [2023-05-10 12:55:28,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:28,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:28,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +25: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +25: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:28,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +29: [2023-05-10 12:55:28,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:28,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +27: [2023-05-10 12:55:28,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +21: [2023-05-10 12:55:28,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:28,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:28,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:28,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:28,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:28,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:28,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:28,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:28,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:28,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:28,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:55:28,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:28,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:55:28,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:28,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:28,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:28,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:28,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:28,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:28,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:28,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:28,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:28,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:28,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:55:28,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:55:28,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +28: [2023-05-10 12:55:28,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:28,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:28,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:28,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:28,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:28,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:28,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:28,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:55:28,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:55:28,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:28,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:28,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:28,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:28,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:28,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:28,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:28,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:28,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:28,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:28,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:28,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:28,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:28,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:28,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:28,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:28,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:28,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:28,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:28,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:28,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:28,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:28,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:28,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:28,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:28,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:28,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:28,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:55:28,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:28,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:28,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +23: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:28,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:28,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:55:28,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +22: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:28,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:28,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:28,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:28,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:28,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +16: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:55:28,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +22: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:28,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +25: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 1: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +28: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +11: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 4: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:55:28,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +21: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:28,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:55:28,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:28,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:28,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:28,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:28,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:28,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +28: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +11: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +19: [2023-05-10 12:55:28,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:28,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +18: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:28,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:28,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:28,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:28,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +25: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +26: [2023-05-10 12:55:28,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +28: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:28,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +31: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:28,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:28,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:28,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:28,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:28,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:28,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:28,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:28,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:28,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +16: [2023-05-10 12:55:28,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:55:28,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:28,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:28,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:28,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 0: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:28,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:28,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:28,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +28: [2023-05-10 12:55:28,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 1: [2023-05-10 12:55:28,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +21: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:55:28,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +11: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +24: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +16: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +27: [2023-05-10 12:55:29,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:55:29,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:29,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:29,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +19: [2023-05-10 12:55:29,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:55:29,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +21: [2023-05-10 12:55:29,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +11: [2023-05-10 12:55:29,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +15: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:29,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +19: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +19: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:29,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +20: [2023-05-10 12:55:29,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:29,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +17: [2023-05-10 12:55:29,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +31: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +27: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:29,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +17: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +18: [2023-05-10 12:55:29,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +31: [2023-05-10 12:55:29,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:29,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:29,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +10: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +24: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +24: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +19: [2023-05-10 12:55:29,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +24: [2023-05-10 12:55:29,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:29,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +12: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +29: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:29,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +17: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +18: [2023-05-10 12:55:29,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:29,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:29,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:29,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +27: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:29,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:29,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:55:29,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:29,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +10: [2023-05-10 12:55:29,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:29,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +18: [2023-05-10 12:55:29,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:29,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:29,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +12: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +17: [2023-05-10 12:55:29,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +17: [2023-05-10 12:55:29,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +17: [2023-05-10 12:55:29,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:29,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +17: [2023-05-10 12:55:29,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:29,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:29,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:29,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:29,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +10: [2023-05-10 12:55:29,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:29,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:29,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +10: [2023-05-10 12:55:29,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +10: [2023-05-10 12:55:29,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +12: [2023-05-10 12:55:29,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +12: [2023-05-10 12:55:29,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +15: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:29,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:29,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +20: [2023-05-10 12:55:29,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +14: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +26: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_08-model_01-model_states.pt. +30: [2023-05-10 12:55:29,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:29,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:29,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:29,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:29,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +30: [2023-05-10 12:55:29,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:29,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +20: [2023-05-10 12:55:29,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:29,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +14: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +15: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +13: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt... +26: [2023-05-10 12:55:29,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:29,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +26: [2023-05-10 12:55:29,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +23: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +15: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:29,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:29,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +26: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +13: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:55:29,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +26: [2023-05-10 12:55:29,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:29,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +26: [2023-05-10 12:55:29,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:55:29,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:55:29,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:29,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +30: [2023-05-10 12:55:29,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:29,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +23: [2023-05-10 12:55:29,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +20: [2023-05-10 12:55:29,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:29,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +20: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:29,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. +14: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +13: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +30: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:29,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt... +27: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +15: [2023-05-10 12:55:29,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:29,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:29,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:29,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:29,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:29,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:29,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +25: [2023-05-10 12:55:29,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:29,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:29,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +21: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:29,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:29,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:55:29,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:29,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:29,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:29,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:29,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:29,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:29,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:29,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:29,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +21: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:29,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:29,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:55:29,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:29,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:55:29,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:29,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +19: [2023-05-10 12:55:29,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +19: [2023-05-10 12:55:29,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:55:29,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +11: [2023-05-10 12:55:29,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:55:29,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:29,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:55:29,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:55:29,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +24: [2023-05-10 12:55:29,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:29,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:29,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:29,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +19: [2023-05-10 12:55:29,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:29,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:29,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:29,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:29,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +24: [2023-05-10 12:55:29,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:29,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:29,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:55:29,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +11: [2023-05-10 12:55:29,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:29,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:55:29,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:29,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:29,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:29,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:55:29,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:29,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:29,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:29,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +16: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:29,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:29,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:29,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:55:29,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +19: [2023-05-10 12:55:29,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:55:29,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:29,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:29,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:29,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:29,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:29,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:29,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:29,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:29,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:29,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:29,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:29,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:29,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +18: [2023-05-10 12:55:29,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:29,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:55:29,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:29,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +10: [2023-05-10 12:55:29,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:29,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:29,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +13: [2023-05-10 12:55:29,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +13: [2023-05-10 12:55:29,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +13: [2023-05-10 12:55:29,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +22: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +18: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +31: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:29,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:29,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:29,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:29,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +15: [2023-05-10 12:55:29,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +10: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:55:29,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +15: [2023-05-10 12:55:29,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +15: [2023-05-10 12:55:29,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +22: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:55:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:55:29,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +10: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +23: [2023-05-10 12:55:29,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:29,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:29,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:55:29,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:55:29,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:55:29,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:55:29,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +23: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:55:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +31: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +28: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +19: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +22: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +26: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:55:29,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:55:29,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:55:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:55:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:29,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +28: [2023-05-10 12:55:29,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:29,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +16: [2023-05-10 12:55:29,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +20: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +13: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +21: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:55:29,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:29,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +16: [2023-05-10 12:55:29,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +17: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +30: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 6: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +12: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +17: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:55:29,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +14: [2023-05-10 12:55:29,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:29,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:29,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:29,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:55:29,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:29,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:55:29,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +29: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +25: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +31: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +31: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +23: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +25: [2023-05-10 12:55:29,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:55:29,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:29,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +25: [2023-05-10 12:55:29,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +25: [2023-05-10 12:55:29,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +22: [2023-05-10 12:55:29,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +16: [2023-05-10 12:55:29,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +22: [2023-05-10 12:55:29,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:55:29,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +20: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +23: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +30: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +14: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +29: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +12: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +16: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +16: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:29,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:29,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:29,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 7: [2023-05-10 12:55:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:29,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:29,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +18: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +24: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +24: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +28: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +20: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +17: [2023-05-10 12:55:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:29,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +16: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:29,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:29,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +27: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +30: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +26: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +27: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:29,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:29,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:29,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +12: [2023-05-10 12:55:29,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +12: [2023-05-10 12:55:29,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +14: [2023-05-10 12:55:29,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +14: [2023-05-10 12:55:29,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:29,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:29,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:29,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +18: [2023-05-10 12:55:29,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +28: [2023-05-10 12:55:29,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +28: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 6: [2023-05-10 12:55:29,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +11: [2023-05-10 12:55:29,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_09-model_01-model_states.pt. +10: [2023-05-10 12:55:29,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:29,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt... +11: [2023-05-10 12:55:29,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +29: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +29: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:29,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +30: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +25: [2023-05-10 12:55:29,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:55:29,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +21: [2023-05-10 12:55:29,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:55:29,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_00-model_states.pt. +16: [2023-05-10 12:55:29,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt... +21: [2023-05-10 12:55:29,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:55:29,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +21: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:29,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +21: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +17: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:29,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +29: [2023-05-10 12:55:29,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +29: [2023-05-10 12:55:29,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +17: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:29,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:55:29,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +29: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +29: [2023-05-10 12:55:29,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:29,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:29,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:29,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:29,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +31: [2023-05-10 12:55:29,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:29,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:29,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:29,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:29,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:29,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +23: [2023-05-10 12:55:29,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:29,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:29,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:29,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +26: [2023-05-10 12:55:29,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:29,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:29,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:29,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:29,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:29,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:29,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:29,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:29,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:29,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:29,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:29,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:29,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:55:29,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:29,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:29,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:29,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +21: [2023-05-10 12:55:29,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:55:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:29,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +26: [2023-05-10 12:55:29,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:29,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +21: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:29,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:29,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:29,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:29,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:29,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:29,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:29,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:29,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:29,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:29,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:29,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:29,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +13: [2023-05-10 12:55:29,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:29,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:29,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:29,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:29,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:29,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +21: [2023-05-10 12:55:29,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:29,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:29,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:29,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:29,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:29,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:29,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:29,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:29,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:29,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +17: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:29,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:29,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:29,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:55:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:29,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:29,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +23: [2023-05-10 12:55:29,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:29,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:29,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:55:29,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 5: [2023-05-10 12:55:29,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:29,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:29,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:29,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:29,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:29,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:29,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:29,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:55:29,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +22: [2023-05-10 12:55:29,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +21: [2023-05-10 12:55:29,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:55:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:29,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:29,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:29,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:29,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:29,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:29,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:29,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 4: [2023-05-10 12:55:29,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:55:29,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:29,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:29,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +16: [2023-05-10 12:55:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:29,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:29,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:29,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:29,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:29,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:55:29,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:29,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:29,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:29,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +25: [2023-05-10 12:55:29,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:29,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:29,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:29,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:29,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:55:29,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:55:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:55:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:55:29,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:29,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:29,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:29,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:55:29,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +31: [2023-05-10 12:55:29,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:55:29,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:55:29,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:29,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:29,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:29,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:29,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:29,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +16: [2023-05-10 12:55:29,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:29,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:29,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:29,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:29,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:29,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:29,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:29,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:29,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:29,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:29,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:55:29,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:29,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:29,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:29,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:29,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:29,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:29,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:29,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:29,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:29,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +31: [2023-05-10 12:55:29,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:29,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:29,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:29,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:29,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:29,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:55:29,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:29,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:29,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:29,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +28: [2023-05-10 12:55:29,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:29,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:29,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:29,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +17: [2023-05-10 12:55:29,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:29,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:29,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:29,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:55:29,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:29,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 2: [2023-05-10 12:55:29,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:29,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:29,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:29,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:29,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 2: [2023-05-10 12:55:29,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:29,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:29,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:29,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:29,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:29,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:29,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:29,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:29,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:29,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:29,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 0: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +27: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:29,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +21: [2023-05-10 12:55:29,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:55:29,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:29,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:29,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 0: [2023-05-10 12:55:29,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:55:29,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:29,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +16: [2023-05-10 12:55:29,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +29: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:29,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:29,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:55:29,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:29,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:29,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:29,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:29,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:29,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:29,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:29,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:29,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:29,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:29,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:29,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +26: [2023-05-10 12:55:29,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:55:29,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:55:29,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:55:29,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:29,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:29,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:29,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:29,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +21: [2023-05-10 12:55:29,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:55:29,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +22: [2023-05-10 12:55:29,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:55:29,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:29,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:29,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:29,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:29,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:29,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:29,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:29,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:29,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:29,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:29,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:29,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:29,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:29,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:29,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:29,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:29,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:29,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:29,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:29,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +26: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:29,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:29,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:29,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:29,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:29,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:29,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:29,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:29,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:29,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:29,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:29,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:29,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:29,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 5: [2023-05-10 12:55:29,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:29,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:29,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:29,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:29,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:29,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:29,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:29,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:29,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:29,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:29,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +15: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:29,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +17: [2023-05-10 12:55:29,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:29,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:29,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:55:29,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:29,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:55:29,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 8: [2023-05-10 12:55:29,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:55:29,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:55:29,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:55:29,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:55:29,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:29,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:29,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:29,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:29,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:29,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:29,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:29,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:29,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:29,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +17: [2023-05-10 12:55:29,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:29,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:29,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:55:29,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:55:29,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +23: [2023-05-10 12:55:29,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:55:29,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:29,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:55:29,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:29,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:55:29,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:55:29,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:55:29,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +24: [2023-05-10 12:55:29,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +19: [2023-05-10 12:55:29,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:29,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:29,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:55:29,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:55:29,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:55:29,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +23: [2023-05-10 12:55:29,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:29,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:29,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:29,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:29,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:29,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 8: [2023-05-10 12:55:29,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:29,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:55:29,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:29,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +24: [2023-05-10 12:55:29,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:55:29,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:29,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +15: [2023-05-10 12:55:29,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:29,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:29,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:29,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +23: [2023-05-10 12:55:29,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:55:29,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:55:29,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +23: [2023-05-10 12:55:29,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +23: [2023-05-10 12:55:29,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +24: [2023-05-10 12:55:29,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:29,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:29,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:29,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +24: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +24: [2023-05-10 12:55:29,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:30,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:30,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:30,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:30,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:30,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:55:30,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:55:30,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:55:30,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:30,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +27: [2023-05-10 12:55:30,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:55:30,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:55:30,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:55:30,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:55:30,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +28: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +16: [2023-05-10 12:55:30,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +31: [2023-05-10 12:55:30,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +12: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +12: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +27: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +27: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +22: [2023-05-10 12:55:30,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +16: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:30,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:30,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +12: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:30,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:30,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:55:30,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +16: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +22: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +27: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +16: [2023-05-10 12:55:30,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +22: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +16: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +16: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +22: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +12: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +22: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +12: [2023-05-10 12:55:30,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +28: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +31: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:55:30,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +31: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +21: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +29: [2023-05-10 12:55:30,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +17: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +17: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +17: [2023-05-10 12:55:30,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:55:30,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +21: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:55:30,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +30: [2023-05-10 12:55:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +29: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +29: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +29: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +17: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +17: [2023-05-10 12:55:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +26: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +13: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +25: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +11: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +29: [2023-05-10 12:55:30,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:30,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:30,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:55:30,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +20: [2023-05-10 12:55:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +26: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +13: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +26: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +27: [2023-05-10 12:55:30,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +26: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:30,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:30,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:55:30,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:30,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:30,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:30,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:30,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +23: [2023-05-10 12:55:30,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +27: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +20: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +20: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +20: [2023-05-10 12:55:30,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:55:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +30: [2023-05-10 12:55:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:30,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:55:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:55:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:30,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +25: [2023-05-10 12:55:30,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:30,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:30,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:30,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +15: [2023-05-10 12:55:30,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +13: [2023-05-10 12:55:30,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +14: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:30,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +25: [2023-05-10 12:55:30,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:30,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:30,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +14: [2023-05-10 12:55:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +14: [2023-05-10 12:55:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +27: [2023-05-10 12:55:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +18: [2023-05-10 12:55:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +30: [2023-05-10 12:55:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:30,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:30,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:30,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:30,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +14: [2023-05-10 12:55:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:30,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +10: [2023-05-10 12:55:30,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:30,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +10: [2023-05-10 12:55:30,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +18: [2023-05-10 12:55:30,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +19: [2023-05-10 12:55:30,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:30,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +19: [2023-05-10 12:55:30,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:30,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +30: [2023-05-10 12:55:30,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:30,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +30: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +30: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +30: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +19: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +19: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:30,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +18: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +18: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:30,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:30,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:55:30,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:55:30,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:30,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +15: [2023-05-10 12:55:30,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:30,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:30,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_10-model_01-model_states.pt. +10: [2023-05-10 12:55:30,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +10: [2023-05-10 12:55:30,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:30,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +11: [2023-05-10 12:55:30,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:55:30,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:55:30,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:55:30,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt... +11: [2023-05-10 12:55:30,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:30,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:30,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +10: [2023-05-10 12:55:30,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. +11: [2023-05-10 12:55:30,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:30,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:30,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... +10: [2023-05-10 12:55:30,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:30,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:30,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:30,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +11: [2023-05-10 12:55:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +24: [2023-05-10 12:55:30,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:30,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +24: [2023-05-10 12:55:30,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +12: [2023-05-10 12:55:30,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +11: [2023-05-10 12:55:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +11: [2023-05-10 12:55:30,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:55:30,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:55:30,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:55:30,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:30,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:30,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:30,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:55:30,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +24: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +22: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +12: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +12: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +20: [2023-05-10 12:55:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +13: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +12: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +26: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:30,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +13: [2023-05-10 12:55:30,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +22: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +16: [2023-05-10 12:55:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:30,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +20: [2023-05-10 12:55:30,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:30,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +12: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +12: [2023-05-10 12:55:30,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +16: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:30,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:30,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:55:30,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:30,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:30,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:30,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +21: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:30,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:30,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +20: [2023-05-10 12:55:30,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +20: [2023-05-10 12:55:30,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +13: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +16: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +26: [2023-05-10 12:55:30,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:30,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +20: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:55:30,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +30: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:30,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +16: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +27: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +18: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +27: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +19: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +19: [2023-05-10 12:55:30,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:55:30,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:30,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:30,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +14: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +14: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:30,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +30: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +19: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +27: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +18: [2023-05-10 12:55:30,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:30,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:30,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +10: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:30,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:30,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +15: [2023-05-10 12:55:30,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +20: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:30,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +17: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:30,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +14: [2023-05-10 12:55:30,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:30,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +10: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_11-model_01-model_states.pt. +15: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +15: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +19: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:30,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +30: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +27: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:30,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +14: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:30,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +24: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +17: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +17: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +10: [2023-05-10 12:55:30,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +15: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +15: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +27: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +10: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +27: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +18: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +27: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. +18: [2023-05-10 12:55:30,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +27: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... +19: [2023-05-10 12:55:30,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:30,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:30,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +30: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +17: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +24: [2023-05-10 12:55:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:30,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:30,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +19: [2023-05-10 12:55:30,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +31: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:55:30,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:55:30,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:30,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:30,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +24: [2023-05-10 12:55:30,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:30,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:30,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +24: [2023-05-10 12:55:30,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:55:30,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +24: [2023-05-10 12:55:30,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +31: [2023-05-10 12:55:30,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +13: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt... +11: [2023-05-10 12:55:30,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +31: [2023-05-10 12:55:30,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:55:30,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:30,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:30,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:30,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +15: [2023-05-10 12:55:30,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +31: [2023-05-10 12:55:30,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:55:30,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:55:30,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +13: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +23: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +20: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +20: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +20: [2023-05-10 12:55:30,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:55:30,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:55:30,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:55:30,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +12: [2023-05-10 12:55:30,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +15: [2023-05-10 12:55:30,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +23: [2023-05-10 12:55:30,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +13: [2023-05-10 12:55:30,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +13: [2023-05-10 12:55:30,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:30,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:30,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:55:30,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:55:30,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:55:30,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +25: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +21: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:30,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +20: [2023-05-10 12:55:30,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:30,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:55:30,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:30,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:30,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +28: [2023-05-10 12:55:30,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +22: [2023-05-10 12:55:30,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:30,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:30,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +28: [2023-05-10 12:55:30,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +16: [2023-05-10 12:55:30,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +17: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:30,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:30,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +21: [2023-05-10 12:55:30,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +21: [2023-05-10 12:55:30,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +28: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +23: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:30,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:30,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +29: [2023-05-10 12:55:30,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:30,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +30: [2023-05-10 12:55:30,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:55:30,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +30: [2023-05-10 12:55:30,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +30: [2023-05-10 12:55:30,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:30,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +16: [2023-05-10 12:55:30,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:55:30,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +15: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +29: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +29: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +26: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:30,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +22: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +20: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:55:30,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:55:30,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +26: [2023-05-10 12:55:30,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +28: [2023-05-10 12:55:30,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +25: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:30,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +29: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +22: [2023-05-10 12:55:30,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +16: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:55:30,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +16: [2023-05-10 12:55:30,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +26: [2023-05-10 12:55:30,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +28: [2023-05-10 12:55:30,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +10: [2023-05-10 12:55:30,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +26: [2023-05-10 12:55:30,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:55:30,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +23: [2023-05-10 12:55:30,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +18: [2023-05-10 12:55:30,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +21: [2023-05-10 12:55:30,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +26: [2023-05-10 12:55:30,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:55:30,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:55:30,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +21: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +19: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +14: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +17: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +17: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +28: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +22: [2023-05-10 12:55:30,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +11: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:55:30,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_12-model_01-model_states.pt. +14: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +25: [2023-05-10 12:55:30,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +11: [2023-05-10 12:55:30,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +25: [2023-05-10 12:55:30,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:55:30,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:55:30,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:30,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +19: [2023-05-10 12:55:30,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +12: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:55:30,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:30,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:55:30,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt... +18: [2023-05-10 12:55:30,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +11: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +18: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +25: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +25: [2023-05-10 12:55:30,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +14: [2023-05-10 12:55:30,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +14: [2023-05-10 12:55:30,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +14: [2023-05-10 12:55:30,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +18: [2023-05-10 12:55:30,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:30,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:30,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:30,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +12: [2023-05-10 12:55:30,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +15: [2023-05-10 12:55:30,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:55:30,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +11: [2023-05-10 12:55:30,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +18: [2023-05-10 12:55:30,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:30,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:55:30,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +10: [2023-05-10 12:55:30,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:55:30,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +19: [2023-05-10 12:55:30,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +10: [2023-05-10 12:55:30,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +12: [2023-05-10 12:55:30,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_00-model_states.pt. +27: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt... +11: [2023-05-10 12:55:30,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +31: [2023-05-10 12:55:30,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +12: [2023-05-10 12:55:30,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:55:30,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:55:30,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:55:30,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +23: [2023-05-10 12:55:30,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +23: [2023-05-10 12:55:30,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +23: [2023-05-10 12:55:30,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:55:30,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +24: [2023-05-10 12:55:30,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:30,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +23: [2023-05-10 12:55:30,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +24: [2023-05-10 12:55:30,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:55:30,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:55:30,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +24: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +27: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:30,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +24: [2023-05-10 12:55:30,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +24: [2023-05-10 12:55:30,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:55:30,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +31: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +31: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:55:30,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +31: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:30,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +27: [2023-05-10 12:55:30,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:30,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:30,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:30,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:30,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +31: [2023-05-10 12:55:30,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +15: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +27: [2023-05-10 12:55:30,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +13: [2023-05-10 12:55:30,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +20: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:30,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +13: [2023-05-10 12:55:30,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +13: [2023-05-10 12:55:30,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +18: [2023-05-10 12:55:30,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:55:30,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +13: [2023-05-10 12:55:30,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:55:30,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +15: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +20: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +31: [2023-05-10 12:55:30,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:55:30,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +30: [2023-05-10 12:55:30,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +31: [2023-05-10 12:55:30,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +23: [2023-05-10 12:55:30,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:30,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +18: [2023-05-10 12:55:30,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +15: [2023-05-10 12:55:30,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:55:30,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:55:30,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:55:30,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:30,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:30,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +20: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +20: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +11: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +19: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:30,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +10: [2023-05-10 12:55:30,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +29: [2023-05-10 12:55:30,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +11: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +29: [2023-05-10 12:55:30,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:30,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:30,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:30,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:30,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:30,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +11: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +11: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +18: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +30: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +30: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +30: [2023-05-10 12:55:30,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +14: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +11: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_13-model_01-model_states.pt. +12: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +21: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +12: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +12: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +17: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +28: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +26: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:30,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:30,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +19: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +14: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... +10: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +11: [2023-05-10 12:55:30,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +15: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +10: [2023-05-10 12:55:30,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +12: [2023-05-10 12:55:30,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:30,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:30,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:30,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +25: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +25: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:55:30,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +25: [2023-05-10 12:55:30,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:30,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +15: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +11: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +31: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +10: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +19: [2023-05-10 12:55:30,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +19: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +17: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +17: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +21: [2023-05-10 12:55:30,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:30,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +11: [2023-05-10 12:55:30,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:55:30,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:30,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +14: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +25: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +15: [2023-05-10 12:55:30,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_00-model_states.pt. +22: [2023-05-10 12:55:30,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt... +16: [2023-05-10 12:55:30,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:30,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +17: [2023-05-10 12:55:30,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:55:30,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:30,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:30,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:30,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:30,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:30,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:30,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:30,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:30,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +16: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +24: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:30,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +17: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +24: [2023-05-10 12:55:30,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +24: [2023-05-10 12:55:30,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:30,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +26: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +29: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +26: [2023-05-10 12:55:30,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:30,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +17: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +26: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +29: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +26: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +25: [2023-05-10 12:55:30,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +29: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +13: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +17: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +16: [2023-05-10 12:55:30,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:30,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:30,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +24: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +29: [2023-05-10 12:55:30,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +24: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +26: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +13: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +24: [2023-05-10 12:55:30,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +29: [2023-05-10 12:55:30,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +26: [2023-05-10 12:55:30,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:30,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +18: [2023-05-10 12:55:30,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:30,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:30,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:30,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:55:30,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +26: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:30,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +29: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:30,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:30,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +17: [2023-05-10 12:55:30,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:30,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:30,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:55:30,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:55:30,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +28: [2023-05-10 12:55:30,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:30,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:30,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +21: [2023-05-10 12:55:30,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:30,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 3: [2023-05-10 12:55:30,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +24: [2023-05-10 12:55:30,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +24: [2023-05-10 12:55:30,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:55:30,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:30,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +13: [2023-05-10 12:55:30,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:30,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +13: [2023-05-10 12:55:30,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +28: [2023-05-10 12:55:30,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:30,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +28: [2023-05-10 12:55:30,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:30,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 0: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:55:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +20: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 7: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:30,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +10: [2023-05-10 12:55:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:30,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:30,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +20: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +21: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +21: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +28: [2023-05-10 12:55:30,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:30,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +22: [2023-05-10 12:55:30,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:30,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +10: [2023-05-10 12:55:30,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +22: [2023-05-10 12:55:30,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 8: [2023-05-10 12:55:30,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +30: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +20: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +20: [2023-05-10 12:55:30,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 7: [2023-05-10 12:55:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:30,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:30,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:55:30,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:30,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:55:30,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +10: [2023-05-10 12:55:30,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +10: [2023-05-10 12:55:30,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 1: [2023-05-10 12:55:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:30,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +22: [2023-05-10 12:55:30,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:55:30,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:30,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:30,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:30,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:30,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:30,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +30: [2023-05-10 12:55:30,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:30,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:30,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:30,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:30,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:30,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:30,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:30,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:55:30,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:55:30,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:55:30,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. + 6: [2023-05-10 12:55:30,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +14: [2023-05-10 12:55:30,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +18: [2023-05-10 12:55:30,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +12: [2023-05-10 12:55:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +11: [2023-05-10 12:55:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:30,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_14-model_01-model_states.pt. +23: [2023-05-10 12:55:30,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:30,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +23: [2023-05-10 12:55:30,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:30,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:30,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +30: [2023-05-10 12:55:30,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +30: [2023-05-10 12:55:30,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:55:30,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:30,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +30: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 9: [2023-05-10 12:55:30,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +14: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +14: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:30,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +12: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt... +15: [2023-05-10 12:55:30,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:30,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:30,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:30,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:30,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:30,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 9: [2023-05-10 12:55:30,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +12: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:55:30,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +23: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +27: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +12: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +27: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +14: [2023-05-10 12:55:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +23: [2023-05-10 12:55:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +27: [2023-05-10 12:55:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +21: [2023-05-10 12:55:30,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +19: [2023-05-10 12:55:30,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:30,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +14: [2023-05-10 12:55:30,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +18: [2023-05-10 12:55:30,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. +18: [2023-05-10 12:55:30,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:30,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:30,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +22: [2023-05-10 12:55:30,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... + 6: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +15: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:30,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:30,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +19: [2023-05-10 12:55:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:30,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:30,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +22: [2023-05-10 12:55:30,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:55:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt... +27: [2023-05-10 12:55:30,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 8: [2023-05-10 12:55:30,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +15: [2023-05-10 12:55:30,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:30,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:30,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:30,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:30,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:30,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:30,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:30,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:30,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:30,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:55:30,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:30,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:30,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:30,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:30,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:30,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:30,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:30,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:30,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:30,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:30,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:30,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:30,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:30,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:30,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:30,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:30,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:30,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:55:30,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:30,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:30,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:30,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +24: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 1: [2023-05-10 12:55:30,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:55:30,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:30,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:30,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:30,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:30,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:30,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +19: [2023-05-10 12:55:30,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:30,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:30,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:30,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:30,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:30,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:30,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +11: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +27: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +19: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:30,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +24: [2023-05-10 12:55:30,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +25: [2023-05-10 12:55:30,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:30,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:30,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:30,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 1: [2023-05-10 12:55:30,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:30,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +23: [2023-05-10 12:55:30,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:30,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:30,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:55:30,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:30,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +17: [2023-05-10 12:55:30,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:30,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:30,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:30,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:30,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:30,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:30,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +20: [2023-05-10 12:55:30,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +25: [2023-05-10 12:55:30,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +31: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 2: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +13: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +19: [2023-05-10 12:55:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:30,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +11: [2023-05-10 12:55:30,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +11: [2023-05-10 12:55:30,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +19: [2023-05-10 12:55:30,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:30,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 5: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +29: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:55:30,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:30,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:30,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:30,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:30,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:30,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +11: [2023-05-10 12:55:30,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +24: [2023-05-10 12:55:30,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +16: [2023-05-10 12:55:30,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +24: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +24: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +24: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +20: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 4: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:30,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 3: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 2: [2023-05-10 12:55:30,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +24: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:30,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:30,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:30,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 5: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +16: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:30,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +13: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +27: [2023-05-10 12:55:30,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:30,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:30,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:30,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:30,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:30,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +27: [2023-05-10 12:55:30,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:30,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:30,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 4: [2023-05-10 12:55:30,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:30,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:30,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:30,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +25: [2023-05-10 12:55:30,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:30,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:30,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +25: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +16: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:55:31,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +20: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +13: [2023-05-10 12:55:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +29: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +29: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:55:31,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +26: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +25: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +29: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +13: [2023-05-10 12:55:31,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +20: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +31: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +31: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +29: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +17: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +31: [2023-05-10 12:55:31,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +31: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +31: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +16: [2023-05-10 12:55:31,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +31: [2023-05-10 12:55:31,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +31: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +31: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +17: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +30: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +28: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +12: [2023-05-10 12:55:31,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +14: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +18: [2023-05-10 12:55:31,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +10: [2023-05-10 12:55:31,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_15-model_01-model_states.pt. +21: [2023-05-10 12:55:31,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +15: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +22: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +15: [2023-05-10 12:55:31,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:31,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:31,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:31,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +14: [2023-05-10 12:55:31,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:31,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +10: [2023-05-10 12:55:31,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +12: [2023-05-10 12:55:31,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +18: [2023-05-10 12:55:31,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt... +21: [2023-05-10 12:55:31,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:31,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +22: [2023-05-10 12:55:31,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +28: [2023-05-10 12:55:31,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +14: [2023-05-10 12:55:31,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:31,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +14: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +22: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:31,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:31,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:31,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +12: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +21: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:31,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:55:31,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:55:31,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +28: [2023-05-10 12:55:31,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:55:31,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +12: [2023-05-10 12:55:31,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +18: [2023-05-10 12:55:31,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:31,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +15: [2023-05-10 12:55:31,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:55:31,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... +10: [2023-05-10 12:55:31,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +10: [2023-05-10 12:55:31,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +15: [2023-05-10 12:55:31,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +22: [2023-05-10 12:55:31,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +18: [2023-05-10 12:55:31,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +15: [2023-05-10 12:55:31,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:31,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +22: [2023-05-10 12:55:31,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_00-model_states.pt. +14: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:31,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +21: [2023-05-10 12:55:31,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +21: [2023-05-10 12:55:31,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +22: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +22: [2023-05-10 12:55:31,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:31,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +24: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +28: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +19: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +21: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +30: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +21: [2023-05-10 12:55:31,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +11: [2023-05-10 12:55:31,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +11: [2023-05-10 12:55:31,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +11: [2023-05-10 12:55:31,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +30: [2023-05-10 12:55:31,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +28: [2023-05-10 12:55:31,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +16: [2023-05-10 12:55:31,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +16: [2023-05-10 12:55:31,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +30: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +11: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +11: [2023-05-10 12:55:31,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +28: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +30: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +19: [2023-05-10 12:55:31,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +16: [2023-05-10 12:55:31,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +18: [2023-05-10 12:55:31,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:31,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +19: [2023-05-10 12:55:31,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:55:31,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:55:31,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +15: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +23: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +20: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +27: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +15: [2023-05-10 12:55:31,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +14: [2023-05-10 12:55:31,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:55:31,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:55:31,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +18: [2023-05-10 12:55:31,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +13: [2023-05-10 12:55:31,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +19: [2023-05-10 12:55:31,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:31,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +18: [2023-05-10 12:55:31,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +20: [2023-05-10 12:55:31,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +13: [2023-05-10 12:55:31,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +15: [2023-05-10 12:55:31,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:31,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:31,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +27: [2023-05-10 12:55:31,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +14: [2023-05-10 12:55:31,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +24: [2023-05-10 12:55:31,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:31,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:31,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:31,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:55:31,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +24: [2023-05-10 12:55:31,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +20: [2023-05-10 12:55:31,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +15: [2023-05-10 12:55:31,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +13: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +25: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +27: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +24: [2023-05-10 12:55:31,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +20: [2023-05-10 12:55:31,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +14: [2023-05-10 12:55:31,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +18: [2023-05-10 12:55:31,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +17: [2023-05-10 12:55:31,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +13: [2023-05-10 12:55:31,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +26: [2023-05-10 12:55:31,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +26: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +17: [2023-05-10 12:55:31,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:55:31,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:55:31,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +26: [2023-05-10 12:55:31,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +10: [2023-05-10 12:55:31,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:31,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +25: [2023-05-10 12:55:31,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:55:31,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:55:31,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:55:31,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +12: [2023-05-10 12:55:31,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_16-model_01-model_states.pt. +25: [2023-05-10 12:55:31,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +25: [2023-05-10 12:55:31,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +10: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +12: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +23: [2023-05-10 12:55:31,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:31,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:55:31,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:31,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... +25: [2023-05-10 12:55:31,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:31,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:31,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:31,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +23: [2023-05-10 12:55:31,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +23: [2023-05-10 12:55:31,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:55:31,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:31,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:31,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:55:31,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +11: [2023-05-10 12:55:31,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +11: [2023-05-10 12:55:31,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:55:31,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:31,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +30: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +25: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:55:31,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +10: [2023-05-10 12:55:31,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:31,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:31,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +23: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. +12: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +25: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +10: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +12: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... +29: [2023-05-10 12:55:31,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:31,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +31: [2023-05-10 12:55:31,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:31,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:31,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:55:31,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:55:31,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:55:31,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:55:31,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:55:31,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +16: [2023-05-10 12:55:31,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +29: [2023-05-10 12:55:31,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +29: [2023-05-10 12:55:31,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:55:31,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:55:31,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:31,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:31,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:55:31,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:31,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:31,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +15: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +31: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +31: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +29: [2023-05-10 12:55:31,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +29: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:55:31,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +31: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +15: [2023-05-10 12:55:31,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:55:31,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +19: [2023-05-10 12:55:31,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +15: [2023-05-10 12:55:31,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:31,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:31,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:55:31,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:55:31,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:55:31,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:31,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:31,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:31,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:31,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +21: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +20: [2023-05-10 12:55:31,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:31,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +30: [2023-05-10 12:55:31,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +30: [2023-05-10 12:55:31,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +30: [2023-05-10 12:55:31,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:31,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:31,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +19: [2023-05-10 12:55:31,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:31,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +21: [2023-05-10 12:55:31,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:31,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:55:31,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:55:31,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +11: [2023-05-10 12:55:31,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +17: [2023-05-10 12:55:31,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:55:31,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:31,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +11: [2023-05-10 12:55:31,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +20: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +20: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +20: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:55:31,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +22: [2023-05-10 12:55:31,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:55:31,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +22: [2023-05-10 12:55:31,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:31,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:31,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +20: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +30: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +30: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +30: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +30: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +22: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +22: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:55:31,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +24: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +10: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +17: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +21: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +21: [2023-05-10 12:55:31,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:55:31,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +11: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +28: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +14: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +28: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +14: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +14: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +11: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +21: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +19: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +17: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +26: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +18: [2023-05-10 12:55:31,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +13: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +18: [2023-05-10 12:55:31,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +17: [2023-05-10 12:55:31,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:31,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +28: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +13: [2023-05-10 12:55:31,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +26: [2023-05-10 12:55:31,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +26: [2023-05-10 12:55:31,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +20: [2023-05-10 12:55:31,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +28: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +13: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +13: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +23: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +14: [2023-05-10 12:55:31,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:55:31,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +28: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +24: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:31,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +14: [2023-05-10 12:55:31,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +26: [2023-05-10 12:55:31,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:55:31,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +18: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +18: [2023-05-10 12:55:31,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:31,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +10: [2023-05-10 12:55:31,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:55:31,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +12: [2023-05-10 12:55:31,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:31,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_17-model_01-model_states.pt. +23: [2023-05-10 12:55:31,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +16: [2023-05-10 12:55:31,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:31,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +23: [2023-05-10 12:55:31,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +12: [2023-05-10 12:55:31,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +16: [2023-05-10 12:55:31,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +10: [2023-05-10 12:55:31,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt... +24: [2023-05-10 12:55:31,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:31,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:55:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +16: [2023-05-10 12:55:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +27: [2023-05-10 12:55:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +12: [2023-05-10 12:55:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:55:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +27: [2023-05-10 12:55:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +12: [2023-05-10 12:55:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:31,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +24: [2023-05-10 12:55:31,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_00-model_states.pt. +10: [2023-05-10 12:55:31,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +10: [2023-05-10 12:55:31,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt... +15: [2023-05-10 12:55:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +23: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:31,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:31,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:31,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:31,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:31,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:31,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +29: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:31,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +27: [2023-05-10 12:55:31,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:31,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:55:31,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:55:31,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:31,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:55:31,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:55:31,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:55:31,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +15: [2023-05-10 12:55:31,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:31,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +25: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +25: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +31: [2023-05-10 12:55:31,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:31,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +29: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:55:31,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:31,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +15: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:31,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:31,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:55:31,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:31,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:31,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:31,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:31,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:31,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +15: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +13: [2023-05-10 12:55:31,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:31,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:31,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:31,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:31,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:31,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:31,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:55:31,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +15: [2023-05-10 12:55:31,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:31,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:31,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:31,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:31,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:31,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:31,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:31,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:31,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:55:31,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +17: [2023-05-10 12:55:31,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:31,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +31: [2023-05-10 12:55:31,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:31,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:31,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:31,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:31,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:31,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:31,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:31,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:31,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:31,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:31,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:31,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:31,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:55:31,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:55:31,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +17: [2023-05-10 12:55:31,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +17: [2023-05-10 12:55:31,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:31,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:31,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:31,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:31,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 7: [2023-05-10 12:55:31,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:55:31,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:55:31,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:55:31,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:55:31,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +26: [2023-05-10 12:55:31,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +19: [2023-05-10 12:55:31,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 3: [2023-05-10 12:55:31,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:31,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:31,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:31,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:55:31,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +11: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +21: [2023-05-10 12:55:31,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:31,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:31,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:55:31,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:55:31,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +28: [2023-05-10 12:55:31,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +20: [2023-05-10 12:55:31,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:31,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:55:31,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:31,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:31,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:31,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:31,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:31,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:55:31,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:55:31,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +18: [2023-05-10 12:55:31,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 5: [2023-05-10 12:55:31,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +19: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:31,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +19: [2023-05-10 12:55:31,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +19: [2023-05-10 12:55:31,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:31,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +11: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +20: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +11: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +11: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:31,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:31,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 2: [2023-05-10 12:55:31,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:55:31,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 1: [2023-05-10 12:55:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:31,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 1: [2023-05-10 12:55:31,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:31,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:55:31,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:31,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 1: [2023-05-10 12:55:31,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:31,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +28: [2023-05-10 12:55:31,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +28: [2023-05-10 12:55:31,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:55:31,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:55:31,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +18: [2023-05-10 12:55:31,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +18: [2023-05-10 12:55:31,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:55:31,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:55:31,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:55:31,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:31,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:31,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:31,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:31,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +22: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +18: [2023-05-10 12:55:31,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:55:31,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:31,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:31,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:31,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:31,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +30: [2023-05-10 12:55:31,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +22: [2023-05-10 12:55:31,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +30: [2023-05-10 12:55:31,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:31,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:31,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 9: [2023-05-10 12:55:31,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:31,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +26: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +26: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:31,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +30: [2023-05-10 12:55:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +17: [2023-05-10 12:55:31,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 5: [2023-05-10 12:55:31,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +20: [2023-05-10 12:55:31,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:31,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:31,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:31,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:31,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 5: [2023-05-10 12:55:31,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:31,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +24: [2023-05-10 12:55:31,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:31,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +20: [2023-05-10 12:55:31,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:31,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:31,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:31,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:31,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:31,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:31,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +30: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +22: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +26: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 7: [2023-05-10 12:55:31,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:31,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:31,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:31,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:31,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:31,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +30: [2023-05-10 12:55:31,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:31,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:31,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:31,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:31,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:31,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:31,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:31,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:31,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +16: [2023-05-10 12:55:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +13: [2023-05-10 12:55:31,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:31,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:31,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +24: [2023-05-10 12:55:31,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +23: [2023-05-10 12:55:31,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:31,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:31,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:55:31,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:31,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +12: [2023-05-10 12:55:31,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +12: [2023-05-10 12:55:31,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +12: [2023-05-10 12:55:31,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 6: [2023-05-10 12:55:31,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +13: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +21: [2023-05-10 12:55:31,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 8: [2023-05-10 12:55:31,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:55:31,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:55:31,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:31,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:31,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +16: [2023-05-10 12:55:31,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:55:31,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +12: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:31,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +24: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +24: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +31: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +31: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:31,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +31: [2023-05-10 12:55:31,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:55:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +24: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 8: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +23: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:31,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 8: [2023-05-10 12:55:31,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +16: [2023-05-10 12:55:31,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +12: [2023-05-10 12:55:31,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +15: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +23: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:31,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:31,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:31,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +12: [2023-05-10 12:55:31,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:31,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +31: [2023-05-10 12:55:31,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:31,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +31: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +31: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +31: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +12: [2023-05-10 12:55:31,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:55:31,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +25: [2023-05-10 12:55:31,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:55:31,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +16: [2023-05-10 12:55:31,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:31,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +23: [2023-05-10 12:55:31,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:31,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:31,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +25: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:31,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +23: [2023-05-10 12:55:31,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +16: [2023-05-10 12:55:31,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:31,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +16: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +16: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:31,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +13: [2023-05-10 12:55:31,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:31,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +25: [2023-05-10 12:55:31,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:31,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +21: [2023-05-10 12:55:31,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +25: [2023-05-10 12:55:31,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:31,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:31,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:31,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:31,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:31,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:31,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:31,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:31,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:31,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:31,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:31,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:31,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:31,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:31,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +23: [2023-05-10 12:55:31,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:31,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:31,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:31,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:31,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:31,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:31,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:31,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +14: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. +10: [2023-05-10 12:55:31,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_18-model_01-model_states.pt. + 4: [2023-05-10 12:55:31,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:31,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 4: [2023-05-10 12:55:31,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +27: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:55:31,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +27: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... +14: [2023-05-10 12:55:31,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 2: [2023-05-10 12:55:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:31,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:31,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +10: [2023-05-10 12:55:31,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +10: [2023-05-10 12:55:31,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:55:31,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +14: [2023-05-10 12:55:31,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +14: [2023-05-10 12:55:31,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:31,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:31,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:31,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:31,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:31,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:31,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:31,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:31,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:31,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:31,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +29: [2023-05-10 12:55:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +29: [2023-05-10 12:55:31,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:31,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_00-model_states.pt. +27: [2023-05-10 12:55:31,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:31,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:31,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:31,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:31,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt... +27: [2023-05-10 12:55:31,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:31,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:31,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:31,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:31,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 1: [2023-05-10 12:55:31,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:31,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +29: [2023-05-10 12:55:31,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:31,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:31,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:31,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:31,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:31,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +29: [2023-05-10 12:55:32,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:55:32,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +29: [2023-05-10 12:55:32,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:32,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:55:32,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:32,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:55:32,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:55:32,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +18: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:55:32,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:32,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:32,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:32,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:55:32,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:55:32,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +30: [2023-05-10 12:55:32,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:32,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +17: [2023-05-10 12:55:32,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:32,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:32,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:32,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:32,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:32,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:32,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:55:32,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:32,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:55:32,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:32,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:55:32,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:55:32,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:55:32,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +20: [2023-05-10 12:55:32,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +20: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +30: [2023-05-10 12:55:32,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +30: [2023-05-10 12:55:32,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +17: [2023-05-10 12:55:32,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:32,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +22: [2023-05-10 12:55:32,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +30: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:32,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:32,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +20: [2023-05-10 12:55:32,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +20: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:32,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +21: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +30: [2023-05-10 12:55:32,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:32,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:32,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +22: [2023-05-10 12:55:32,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:55:32,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +28: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +28: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +22: [2023-05-10 12:55:32,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +22: [2023-05-10 12:55:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +30: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:32,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +11: [2023-05-10 12:55:32,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +30: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +19: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +12: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:32,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +13: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +15: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:55:32,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:55:32,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:32,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:32,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +11: [2023-05-10 12:55:32,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:32,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +28: [2023-05-10 12:55:32,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +25: [2023-05-10 12:55:32,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +13: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:32,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +18: [2023-05-10 12:55:32,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +26: [2023-05-10 12:55:32,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +19: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +21: [2023-05-10 12:55:32,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +18: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:55:32,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +14: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +18: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +19: [2023-05-10 12:55:32,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +25: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:32,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +12: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +12: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +11: [2023-05-10 12:55:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +24: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +19: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +26: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:32,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +27: [2023-05-10 12:55:32,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:55:32,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +25: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +13: [2023-05-10 12:55:32,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +12: [2023-05-10 12:55:32,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:32,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +13: [2023-05-10 12:55:32,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:32,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +28: [2023-05-10 12:55:32,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +28: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +21: [2023-05-10 12:55:32,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:32,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +21: [2023-05-10 12:55:32,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +16: [2023-05-10 12:55:32,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:55:32,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:32,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:32,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:32,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +16: [2023-05-10 12:55:32,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:55:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:55:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:55:32,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:32,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +29: [2023-05-10 12:55:32,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:32,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:55:32,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +16: [2023-05-10 12:55:32,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +29: [2023-05-10 12:55:32,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +27: [2023-05-10 12:55:32,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:32,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:32,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:32,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:32,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +10: [2023-05-10 12:55:32,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:55:32,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:55:32,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +24: [2023-05-10 12:55:32,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +10: [2023-05-10 12:55:32,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +14: [2023-05-10 12:55:32,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_19-model_01-model_states.pt. +29: [2023-05-10 12:55:32,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +29: [2023-05-10 12:55:32,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:55:32,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:32,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +14: [2023-05-10 12:55:32,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +24: [2023-05-10 12:55:32,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:32,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:55:32,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:32,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:32,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:55:32,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt... +27: [2023-05-10 12:55:32,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:32,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:32,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +27: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +10: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +29: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +15: [2023-05-10 12:55:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +29: [2023-05-10 12:55:32,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +10: [2023-05-10 12:55:32,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +31: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +31: [2023-05-10 12:55:32,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:55:32,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:55:32,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +23: [2023-05-10 12:55:32,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:32,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:32,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +14: [2023-05-10 12:55:32,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +27: [2023-05-10 12:55:32,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +24: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +17: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +25: [2023-05-10 12:55:32,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +25: [2023-05-10 12:55:32,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:32,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +17: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:32,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:32,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +24: [2023-05-10 12:55:32,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +23: [2023-05-10 12:55:32,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +31: [2023-05-10 12:55:32,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:32,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +27: [2023-05-10 12:55:32,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:55:32,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_00-model_states.pt. +15: [2023-05-10 12:55:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt... +15: [2023-05-10 12:55:32,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +25: [2023-05-10 12:55:32,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:32,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +15: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +27: [2023-05-10 12:55:32,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +31: [2023-05-10 12:55:32,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +31: [2023-05-10 12:55:32,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:32,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +23: [2023-05-10 12:55:32,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:32,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:32,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:32,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:32,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:32,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:55:32,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:55:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +18: [2023-05-10 12:55:32,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:32,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:32,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:32,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:32,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:32,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +17: [2023-05-10 12:55:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +19: [2023-05-10 12:55:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:32,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:55:32,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +17: [2023-05-10 12:55:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +19: [2023-05-10 12:55:32,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:32,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:32,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:32,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:55:32,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:55:32,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +23: [2023-05-10 12:55:32,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +17: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +17: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +17: [2023-05-10 12:55:32,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +23: [2023-05-10 12:55:32,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +29: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +26: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +31: [2023-05-10 12:55:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:55:32,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:32,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:32,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +30: [2023-05-10 12:55:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +15: [2023-05-10 12:55:32,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +22: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +22: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +26: [2023-05-10 12:55:32,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +26: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:32,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +14: [2023-05-10 12:55:32,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +30: [2023-05-10 12:55:32,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +30: [2023-05-10 12:55:32,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:55:32,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:32,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +20: [2023-05-10 12:55:32,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:55:32,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +12: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +28: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +28: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +13: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +30: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +24: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +18: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +26: [2023-05-10 12:55:32,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +18: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +11: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +22: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +22: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +13: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +18: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +21: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +10: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_20-model_01-model_states.pt. +20: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:55:32,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +28: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +20: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +24: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +22: [2023-05-10 12:55:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +25: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +14: [2023-05-10 12:55:32,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +25: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +11: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +19: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:55:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +10: [2023-05-10 12:55:32,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:32,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +21: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +24: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt... +12: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +12: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +14: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +14: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +25: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +16: [2023-05-10 12:55:32,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +20: [2023-05-10 12:55:32,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +24: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +26: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +11: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +11: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +28: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +13: [2023-05-10 12:55:32,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +13: [2023-05-10 12:55:32,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +19: [2023-05-10 12:55:32,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +10: [2023-05-10 12:55:32,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +12: [2023-05-10 12:55:32,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +16: [2023-05-10 12:55:32,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +11: [2023-05-10 12:55:32,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:32,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +24: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +24: [2023-05-10 12:55:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:32,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +21: [2023-05-10 12:55:32,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:32,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. +10: [2023-05-10 12:55:32,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +21: [2023-05-10 12:55:32,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... +16: [2023-05-10 12:55:32,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:32,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +16: [2023-05-10 12:55:32,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +16: [2023-05-10 12:55:32,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:55:32,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:32,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:32,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:32,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:32,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +27: [2023-05-10 12:55:32,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:32,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:32,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:55:32,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:55:32,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +27: [2023-05-10 12:55:32,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +27: [2023-05-10 12:55:32,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +31: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 1: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +31: [2023-05-10 12:55:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +31: [2023-05-10 12:55:32,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:55:32,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:55:32,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:55:32,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +18: [2023-05-10 12:55:32,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:32,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:55:32,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:55:32,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:32,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:55:32,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +25: [2023-05-10 12:55:32,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:32,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:32,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:32,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +27: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +31: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +31: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +17: [2023-05-10 12:55:32,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:32,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +31: [2023-05-10 12:55:32,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:32,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +18: [2023-05-10 12:55:32,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:32,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +31: [2023-05-10 12:55:32,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +31: [2023-05-10 12:55:32,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +18: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +18: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +25: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:55:32,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +26: [2023-05-10 12:55:32,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:32,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:32,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +23: [2023-05-10 12:55:32,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:32,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:55:32,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +18: [2023-05-10 12:55:32,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +18: [2023-05-10 12:55:32,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +25: [2023-05-10 12:55:32,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +25: [2023-05-10 12:55:32,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:32,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +26: [2023-05-10 12:55:32,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +26: [2023-05-10 12:55:32,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +26: [2023-05-10 12:55:32,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +29: [2023-05-10 12:55:32,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +26: [2023-05-10 12:55:32,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:32,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +23: [2023-05-10 12:55:32,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +17: [2023-05-10 12:55:32,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:32,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +19: [2023-05-10 12:55:32,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:55:32,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:55:32,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:32,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +29: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 4: [2023-05-10 12:55:32,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 6: [2023-05-10 12:55:32,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +15: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +15: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:55:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +29: [2023-05-10 12:55:32,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +29: [2023-05-10 12:55:32,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:32,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +19: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:32,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +28: [2023-05-10 12:55:32,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +15: [2023-05-10 12:55:32,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +15: [2023-05-10 12:55:32,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +23: [2023-05-10 12:55:32,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +20: [2023-05-10 12:55:32,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:32,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +19: [2023-05-10 12:55:32,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +23: [2023-05-10 12:55:32,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:55:32,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +19: [2023-05-10 12:55:32,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +19: [2023-05-10 12:55:32,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +20: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +30: [2023-05-10 12:55:32,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:32,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:32,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:32,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 4: [2023-05-10 12:55:32,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:32,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:32,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +28: [2023-05-10 12:55:32,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +19: [2023-05-10 12:55:32,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +30: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +14: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +20: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +28: [2023-05-10 12:55:32,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:32,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +20: [2023-05-10 12:55:32,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +28: [2023-05-10 12:55:32,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:32,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:32,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:32,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:32,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 2: [2023-05-10 12:55:32,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:32,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:32,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +13: [2023-05-10 12:55:32,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +13: [2023-05-10 12:55:32,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:32,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +30: [2023-05-10 12:55:32,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:32,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:32,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:32,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +21: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +30: [2023-05-10 12:55:32,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +30: [2023-05-10 12:55:32,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:32,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +12: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +24: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +10: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +30: [2023-05-10 12:55:32,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:32,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 5: [2023-05-10 12:55:32,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +22: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. +11: [2023-05-10 12:55:32,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_21-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:55:32,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +10: [2023-05-10 12:55:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:55:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +13: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +12: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +21: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +11: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +14: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +21: [2023-05-10 12:55:32,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +22: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +14: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... +24: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +13: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:32,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +10: [2023-05-10 12:55:32,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:32,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +13: [2023-05-10 12:55:32,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:32,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:32,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:32,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +21: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +12: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +10: [2023-05-10 12:55:32,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +14: [2023-05-10 12:55:32,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... + 5: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:32,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +17: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +11: [2023-05-10 12:55:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +12: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:32,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +22: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_00-model_states.pt. +24: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +24: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +11: [2023-05-10 12:55:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +22: [2023-05-10 12:55:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt... +17: [2023-05-10 12:55:32,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 0: [2023-05-10 12:55:32,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:32,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:32,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:32,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:32,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:32,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:32,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +27: [2023-05-10 12:55:32,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +27: [2023-05-10 12:55:32,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +27: [2023-05-10 12:55:32,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:55:32,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:32,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:32,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:32,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:32,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:32,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:32,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:32,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:32,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:32,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:32,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:32,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:32,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:32,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:32,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:32,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:32,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:32,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:32,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:32,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:55:32,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:32,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +27: [2023-05-10 12:55:32,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:32,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +24: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +24: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:32,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +27: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:32,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:32,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:32,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:32,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:32,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:32,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:32,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:32,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:32,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:32,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +16: [2023-05-10 12:55:32,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 3: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +10: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:32,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:32,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:32,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:55:32,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:32,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:32,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 3: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +30: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +23: [2023-05-10 12:55:32,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:32,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:32,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +16: [2023-05-10 12:55:32,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 3: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:32,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:32,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:32,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:32,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:32,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:32,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:32,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:32,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +26: [2023-05-10 12:55:32,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +31: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +30: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:32,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 1: [2023-05-10 12:55:32,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:32,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:32,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +16: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +20: [2023-05-10 12:55:32,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +18: [2023-05-10 12:55:32,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:32,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:32,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +17: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +16: [2023-05-10 12:55:32,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:32,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 1: [2023-05-10 12:55:32,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 1: [2023-05-10 12:55:32,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:32,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:32,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:32,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:32,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:32,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +23: [2023-05-10 12:55:32,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:32,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:32,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +20: [2023-05-10 12:55:32,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:32,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:32,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +18: [2023-05-10 12:55:32,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:32,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:32,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:32,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:55:32,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:32,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:32,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:32,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:32,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:32,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +18: [2023-05-10 12:55:32,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:32,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:32,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +23: [2023-05-10 12:55:32,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:55:32,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +29: [2023-05-10 12:55:32,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:32,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:32,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +23: [2023-05-10 12:55:32,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:32,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +20: [2023-05-10 12:55:32,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +20: [2023-05-10 12:55:32,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:32,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:32,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:32,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +29: [2023-05-10 12:55:32,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 7: [2023-05-10 12:55:32,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:32,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +25: [2023-05-10 12:55:32,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:55:32,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:32,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:32,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:32,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:32,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +15: [2023-05-10 12:55:32,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 9: [2023-05-10 12:55:32,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +26: [2023-05-10 12:55:32,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +29: [2023-05-10 12:55:32,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +29: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +29: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +15: [2023-05-10 12:55:32,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:32,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:32,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +26: [2023-05-10 12:55:32,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:32,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +29: [2023-05-10 12:55:32,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:32,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:32,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:32,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 7: [2023-05-10 12:55:32,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +26: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +26: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:32,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:32,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:32,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:32,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:55:32,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 9: [2023-05-10 12:55:32,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:55:32,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:32,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:32,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:32,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:32,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:32,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:33,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +17: [2023-05-10 12:55:33,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:33,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +10: [2023-05-10 12:55:33,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:33,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +24: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +19: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +19: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +24: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +24: [2023-05-10 12:55:33,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +19: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +28: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:33,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +17: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +31: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:33,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +19: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +24: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +24: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:33,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +28: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +17: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +13: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:33,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +21: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +10: [2023-05-10 12:55:33,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +10: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +10: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +10: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +24: [2023-05-10 12:55:33,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:33,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +31: [2023-05-10 12:55:33,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:33,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +24: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:55:33,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:33,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:33,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +19: [2023-05-10 12:55:33,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:33,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:33,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +24: [2023-05-10 12:55:33,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +28: [2023-05-10 12:55:33,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +28: [2023-05-10 12:55:33,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +19: [2023-05-10 12:55:33,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:33,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:33,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +21: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +30: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +13: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +30: [2023-05-10 12:55:33,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:33,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:55:33,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +21: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +13: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:55:33,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +21: [2023-05-10 12:55:33,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:33,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +14: [2023-05-10 12:55:33,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:33,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +13: [2023-05-10 12:55:33,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:33,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:55:33,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:33,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:33,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:33,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +11: [2023-05-10 12:55:33,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +11: [2023-05-10 12:55:33,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:33,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +14: [2023-05-10 12:55:33,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +25: [2023-05-10 12:55:33,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:33,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:55:33,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:33,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:33,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:33,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +14: [2023-05-10 12:55:33,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:55:33,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:55:33,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +15: [2023-05-10 12:55:33,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +12: [2023-05-10 12:55:33,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +14: [2023-05-10 12:55:33,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:55:33,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +11: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +25: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +15: [2023-05-10 12:55:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +11: [2023-05-10 12:55:33,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:55:33,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +22: [2023-05-10 12:55:33,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +25: [2023-05-10 12:55:33,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_22-model_01-model_states.pt. +12: [2023-05-10 12:55:33,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +12: [2023-05-10 12:55:33,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +12: [2023-05-10 12:55:33,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... +22: [2023-05-10 12:55:33,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +29: [2023-05-10 12:55:33,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +22: [2023-05-10 12:55:33,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:33,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_00-model_states.pt. +22: [2023-05-10 12:55:33,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt... +18: [2023-05-10 12:55:33,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +29: [2023-05-10 12:55:33,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:33,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +30: [2023-05-10 12:55:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:33,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +30: [2023-05-10 12:55:33,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:55:33,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +30: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +30: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:55:33,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 3: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +18: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +18: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +18: [2023-05-10 12:55:33,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:33,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +23: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 3: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:33,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +27: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +17: [2023-05-10 12:55:33,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +31: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +27: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +20: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +27: [2023-05-10 12:55:33,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +17: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +27: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +17: [2023-05-10 12:55:33,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:55:33,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +31: [2023-05-10 12:55:33,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:55:33,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +20: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +26: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +25: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +25: [2023-05-10 12:55:33,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +29: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +31: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +31: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +20: [2023-05-10 12:55:33,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +20: [2023-05-10 12:55:33,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:33,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:55:33,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:33,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +10: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +18: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +18: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +18: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:55:33,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +23: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +23: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:33,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +18: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:55:33,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:55:33,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +25: [2023-05-10 12:55:33,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:55:33,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:55:33,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:55:33,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +10: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +16: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:33,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +25: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +29: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +29: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 0: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 0: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +23: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 1: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 4: [2023-05-10 12:55:33,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:33,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 1: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +26: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +10: [2023-05-10 12:55:33,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 6: [2023-05-10 12:55:33,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 9: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:55:33,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +16: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +15: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:33,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:33,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +15: [2023-05-10 12:55:33,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:33,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:33,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +26: [2023-05-10 12:55:33,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:33,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:33,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 9: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +15: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +26: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 6: [2023-05-10 12:55:33,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +10: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +15: [2023-05-10 12:55:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +16: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 4: [2023-05-10 12:55:33,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +16: [2023-05-10 12:55:33,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:55:33,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +19: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:33,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:33,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:55:33,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:33,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +24: [2023-05-10 12:55:33,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:55:33,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +24: [2023-05-10 12:55:33,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +24: [2023-05-10 12:55:33,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +22: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +24: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +11: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +11: [2023-05-10 12:55:33,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:55:33,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:55:33,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +21: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +21: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 7: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 7: [2023-05-10 12:55:33,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:33,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +19: [2023-05-10 12:55:33,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:33,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +12: [2023-05-10 12:55:33,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:55:33,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:55:33,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +19: [2023-05-10 12:55:33,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:55:33,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:55:33,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:55:33,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:55:33,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +21: [2023-05-10 12:55:33,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +28: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +21: [2023-05-10 12:55:33,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 5: [2023-05-10 12:55:33,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 5: [2023-05-10 12:55:33,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:55:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +12: [2023-05-10 12:55:33,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +12: [2023-05-10 12:55:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +13: [2023-05-10 12:55:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +12: [2023-05-10 12:55:33,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:33,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +19: [2023-05-10 12:55:33,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:33,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 8: [2023-05-10 12:55:33,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:33,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 8: [2023-05-10 12:55:33,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:33,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:55:33,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_23-model_01-model_states.pt. +14: [2023-05-10 12:55:33,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +11: [2023-05-10 12:55:33,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +22: [2023-05-10 12:55:33,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +28: [2023-05-10 12:55:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. + 2: [2023-05-10 12:55:33,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +22: [2023-05-10 12:55:33,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +22: [2023-05-10 12:55:33,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +11: [2023-05-10 12:55:33,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +11: [2023-05-10 12:55:33,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... + 2: [2023-05-10 12:55:33,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +13: [2023-05-10 12:55:33,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt... +14: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:55:33,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:55:33,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:33,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:33,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +14: [2023-05-10 12:55:33,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +14: [2023-05-10 12:55:33,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +28: [2023-05-10 12:55:33,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +28: [2023-05-10 12:55:33,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +13: [2023-05-10 12:55:33,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_00-model_states.pt. +13: [2023-05-10 12:55:33,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt... +17: [2023-05-10 12:55:33,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:55:33,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:55:33,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:55:33,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +17: [2023-05-10 12:55:33,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:33,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:33,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:33,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:33,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +18: [2023-05-10 12:55:33,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:33,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:55:33,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:55:33,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:55:33,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +23: [2023-05-10 12:55:33,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:33,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:33,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +27: [2023-05-10 12:55:33,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:33,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:55:33,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:55:33,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:33,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +20: [2023-05-10 12:55:33,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:33,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:33,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +31: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +30: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 3: [2023-05-10 12:55:33,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +25: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:33,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +29: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:55:33,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +15: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:55:33,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 4: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 9: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +10: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:33,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 1: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +21: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:33,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +16: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +26: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:33,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:33,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:33,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:33,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 0: [2023-05-10 12:55:33,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 7: [2023-05-10 12:55:33,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 5: [2023-05-10 12:55:33,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +28: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +24: [2023-05-10 12:55:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:33,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 8: [2023-05-10 12:55:33,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +22: [2023-05-10 12:55:33,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:33,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:33,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:33,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:33,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:33,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:33,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:33,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +13: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +13: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +13: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +13: [2023-05-10 12:55:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 6: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:33,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:33,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:33,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:33,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +11: [2023-05-10 12:55:33,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:33,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. + 2: [2023-05-10 12:55:33,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:33,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +12: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +14: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_24-model_01-model_states.pt. +19: [2023-05-10 12:55:33,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:33,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:33,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +27: [2023-05-10 12:55:34,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +27: [2023-05-10 12:55:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +27: [2023-05-10 12:55:34,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:34,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +31: [2023-05-10 12:55:34,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:55:34,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:55:34,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +31: [2023-05-10 12:55:34,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +10: [2023-05-10 12:55:34,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:55:34,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:55:34,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:55:34,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:55:34,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:55:34,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:55:34,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +10: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +27: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:55:34,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:55:34,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:55:34,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +20: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:55:34,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +20: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +16: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +17: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +14: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:34,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:34,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +16: [2023-05-10 12:55:34,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +17: [2023-05-10 12:55:34,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +10: [2023-05-10 12:55:34,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +10: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +20: [2023-05-10 12:55:34,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +31: [2023-05-10 12:55:34,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +14: [2023-05-10 12:55:34,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +16: [2023-05-10 12:55:34,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:55:34,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:55:34,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +14: [2023-05-10 12:55:34,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +17: [2023-05-10 12:55:34,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +26: [2023-05-10 12:55:34,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +19: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +19: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +19: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +28: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +13: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +28: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +18: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +26: [2023-05-10 12:55:34,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +13: [2023-05-10 12:55:34,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +13: [2023-05-10 12:55:34,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +21: [2023-05-10 12:55:34,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:34,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +21: [2023-05-10 12:55:34,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +21: [2023-05-10 12:55:34,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:55:34,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +22: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +30: [2023-05-10 12:55:34,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +30: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +23: [2023-05-10 12:55:34,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +25: [2023-05-10 12:55:34,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +15: [2023-05-10 12:55:34,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +19: [2023-05-10 12:55:34,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +28: [2023-05-10 12:55:34,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +18: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +19: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:34,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:34,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +13: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +11: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +18: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +23: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +29: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +29: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +22: [2023-05-10 12:55:34,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +24: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +12: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +11: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +12: [2023-05-10 12:55:34,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... +12: [2023-05-10 12:55:34,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +15: [2023-05-10 12:55:34,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:34,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +15: [2023-05-10 12:55:34,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +24: [2023-05-10 12:55:34,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... +11: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +25: [2023-05-10 12:55:34,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +30: [2023-05-10 12:55:34,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:34,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +29: [2023-05-10 12:55:34,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_00-model_states.pt. +12: [2023-05-10 12:55:34,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:55:34,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:55:34,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:55:34,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:55:34,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +16: [2023-05-10 12:55:34,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +16: [2023-05-10 12:55:34,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +14: [2023-05-10 12:55:34,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:55:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +17: [2023-05-10 12:55:34,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +14: [2023-05-10 12:55:34,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +14: [2023-05-10 12:55:34,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +17: [2023-05-10 12:55:34,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +17: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +22: [2023-05-10 12:55:34,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +26: [2023-05-10 12:55:34,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +26: [2023-05-10 12:55:34,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:55:34,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:55:34,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +18: [2023-05-10 12:55:34,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +23: [2023-05-10 12:55:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +26: [2023-05-10 12:55:34,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +26: [2023-05-10 12:55:34,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +26: [2023-05-10 12:55:34,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +10: [2023-05-10 12:55:34,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +28: [2023-05-10 12:55:34,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:55:34,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +15: [2023-05-10 12:55:34,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +27: [2023-05-10 12:55:34,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +27: [2023-05-10 12:55:34,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +28: [2023-05-10 12:55:34,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +27: [2023-05-10 12:55:34,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:34,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +31: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:55:34,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +31: [2023-05-10 12:55:34,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:34,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:34,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:55:34,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +10: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +10: [2023-05-10 12:55:34,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:34,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:34,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:34,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:34,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +10: [2023-05-10 12:55:34,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +10: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:34,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:55:34,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:34,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:55:34,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +31: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +21: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +10: [2023-05-10 12:55:34,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:34,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:34,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +31: [2023-05-10 12:55:34,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:34,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:34,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +29: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +31: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 0: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +24: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +24: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +24: [2023-05-10 12:55:34,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +25: [2023-05-10 12:55:34,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +30: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +13: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +27: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +27: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 3: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +12: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +24: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +11: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +22: [2023-05-10 12:55:34,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +27: [2023-05-10 12:55:34,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +19: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +19: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:34,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +22: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +22: [2023-05-10 12:55:34,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:34,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 4: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +19: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. + 4: [2023-05-10 12:55:34,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +11: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_25-model_01-model_states.pt. +20: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:34,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +19: [2023-05-10 12:55:34,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +19: [2023-05-10 12:55:34,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +11: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +28: [2023-05-10 12:55:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +20: [2023-05-10 12:55:34,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:55:34,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:55:34,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:55:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +11: [2023-05-10 12:55:34,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:34,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +21: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +21: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +20: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +30: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +20: [2023-05-10 12:55:34,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:34,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 2: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 0: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +20: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:34,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +19: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:55:34,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +15: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +13: [2023-05-10 12:55:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +30: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +13: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +21: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +30: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +25: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +18: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +18: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 9: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +23: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +24: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +23: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 2: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +16: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt... +14: [2023-05-10 12:55:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:34,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +28: [2023-05-10 12:55:34,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:34,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:34,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +21: [2023-05-10 12:55:34,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:34,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 9: [2023-05-10 12:55:34,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +28: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +23: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +14: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 2: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... +25: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +12: [2023-05-10 12:55:34,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt... + 5: [2023-05-10 12:55:34,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:34,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:34,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:34,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:34,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +18: [2023-05-10 12:55:34,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:34,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:34,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 3: [2023-05-10 12:55:34,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +17: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +25: [2023-05-10 12:55:34,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +21: [2023-05-10 12:55:34,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:34,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:34,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +13: [2023-05-10 12:55:34,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +29: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 3: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:34,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +15: [2023-05-10 12:55:34,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:55:34,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:34,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:34,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:34,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:34,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:34,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. + 4: [2023-05-10 12:55:34,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:34,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:34,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_00-model_states.pt. +16: [2023-05-10 12:55:34,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:34,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:34,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:34,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +16: [2023-05-10 12:55:34,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:55:34,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:34,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:34,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:34,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 1: [2023-05-10 12:55:34,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +16: [2023-05-10 12:55:34,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +17: [2023-05-10 12:55:34,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +16: [2023-05-10 12:55:34,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:34,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:34,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:34,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:34,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 1: [2023-05-10 12:55:34,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:34,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 8: [2023-05-10 12:55:34,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:34,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:55:34,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:34,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +14: [2023-05-10 12:55:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:34,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:34,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:34,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:34,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:55:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +17: [2023-05-10 12:55:34,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:34,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +14: [2023-05-10 12:55:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 5: [2023-05-10 12:55:34,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:55:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:55:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +26: [2023-05-10 12:55:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:34,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:55:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +22: [2023-05-10 12:55:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +22: [2023-05-10 12:55:34,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 6: [2023-05-10 12:55:34,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:34,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:34,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:34,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 8: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:34,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:34,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +26: [2023-05-10 12:55:35,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +26: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +26: [2023-05-10 12:55:35,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:35,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:55:35,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +22: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:55:35,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:35,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +26: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +22: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +22: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:35,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:35,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:35,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:35,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +11: [2023-05-10 12:55:35,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:55:35,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:55:35,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:55:35,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:55:35,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +11: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:55:35,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:55:35,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:55:35,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +11: [2023-05-10 12:55:35,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:35,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +10: [2023-05-10 12:55:35,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:55:35,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:35,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +11: [2023-05-10 12:55:35,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +10: [2023-05-10 12:55:35,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +31: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +31: [2023-05-10 12:55:35,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:55:35,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +10: [2023-05-10 12:55:35,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:55:35,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +31: [2023-05-10 12:55:35,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +21: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +21: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +21: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:35,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:35,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +25: [2023-05-10 12:55:35,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +29: [2023-05-10 12:55:35,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:35,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +19: [2023-05-10 12:55:35,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +17: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +20: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:55:35,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:55:35,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:55:35,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:55:35,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:35,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +21: [2023-05-10 12:55:35,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +21: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +25: [2023-05-10 12:55:35,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:35,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +17: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +30: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +17: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +30: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +13: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +24: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:55:35,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +15: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +31: [2023-05-10 12:55:35,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +18: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +24: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +24: [2023-05-10 12:55:35,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +24: [2023-05-10 12:55:35,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +24: [2023-05-10 12:55:35,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:55:35,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:55:35,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:35,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +18: [2023-05-10 12:55:35,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +31: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +31: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +29: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +31: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +20: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:55:35,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +25: [2023-05-10 12:55:35,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +20: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:55:35,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +29: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +29: [2023-05-10 12:55:35,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +23: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +23: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +23: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +23: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +12: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +13: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +13: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +13: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +30: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +30: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +28: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +28: [2023-05-10 12:55:35,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +28: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_26-model_01-model_states.pt. +20: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +27: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +20: [2023-05-10 12:55:35,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:35,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +25: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +12: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +12: [2023-05-10 12:55:35,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +28: [2023-05-10 12:55:35,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:55:35,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +18: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +26: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +26: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +16: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt... +15: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +15: [2023-05-10 12:55:35,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +16: [2023-05-10 12:55:35,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +18: [2023-05-10 12:55:35,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +15: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:55:35,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:55:35,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:55:35,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +27: [2023-05-10 12:55:35,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +15: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:55:35,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +19: [2023-05-10 12:55:35,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +14: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +28: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +27: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +14: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +12: [2023-05-10 12:55:35,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:35,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +28: [2023-05-10 12:55:35,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_00-model_states.pt. +19: [2023-05-10 12:55:35,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt... +19: [2023-05-10 12:55:35,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +22: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +22: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +22: [2023-05-10 12:55:35,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +19: [2023-05-10 12:55:35,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +19: [2023-05-10 12:55:35,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +21: [2023-05-10 12:55:35,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:35,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +21: [2023-05-10 12:55:35,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +11: [2023-05-10 12:55:35,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +11: [2023-05-10 12:55:35,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +21: [2023-05-10 12:55:35,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:35,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +21: [2023-05-10 12:55:35,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:35,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +11: [2023-05-10 12:55:35,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +11: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:55:35,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +23: [2023-05-10 12:55:35,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +13: [2023-05-10 12:55:35,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +24: [2023-05-10 12:55:35,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +14: [2023-05-10 12:55:35,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +23: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +29: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +30: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +25: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +25: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +15: [2023-05-10 12:55:35,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +28: [2023-05-10 12:55:35,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +18: [2023-05-10 12:55:35,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. +12: [2023-05-10 12:55:35,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_27-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +30: [2023-05-10 12:55:35,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:55:35,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +25: [2023-05-10 12:55:35,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +26: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +15: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +26: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +14: [2023-05-10 12:55:35,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:55:35,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +11: [2023-05-10 12:55:35,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:55:35,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:55:35,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +25: [2023-05-10 12:55:35,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:55:35,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +14: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:55:35,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:55:35,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +28: [2023-05-10 12:55:35,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +29: [2023-05-10 12:55:35,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +26: [2023-05-10 12:55:35,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:55:35,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +14: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:55:35,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +11: [2023-05-10 12:55:35,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +30: [2023-05-10 12:55:35,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:55:35,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +15: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +28: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +17: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +29: [2023-05-10 12:55:35,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +28: [2023-05-10 12:55:35,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +11: [2023-05-10 12:55:35,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +30: [2023-05-10 12:55:35,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +17: [2023-05-10 12:55:35,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +18: [2023-05-10 12:55:35,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +29: [2023-05-10 12:55:35,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +15: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 6: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:55:35,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +18: [2023-05-10 12:55:35,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +10: [2023-05-10 12:55:35,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +10: [2023-05-10 12:55:35,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +27: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +27: [2023-05-10 12:55:35,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:35,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +18: [2023-05-10 12:55:35,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +22: [2023-05-10 12:55:35,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +16: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +10: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +12: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +16: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +13: [2023-05-10 12:55:35,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +13: [2023-05-10 12:55:35,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +12: [2023-05-10 12:55:35,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +22: [2023-05-10 12:55:35,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +10: [2023-05-10 12:55:35,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +10: [2023-05-10 12:55:35,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:55:35,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +23: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +22: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +13: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +31: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +10: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:35,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +31: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +24: [2023-05-10 12:55:35,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +24: [2023-05-10 12:55:35,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... +20: [2023-05-10 12:55:35,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... +24: [2023-05-10 12:55:35,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +24: [2023-05-10 12:55:35,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +27: [2023-05-10 12:55:35,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +23: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:35,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +27: [2023-05-10 12:55:35,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +20: [2023-05-10 12:55:35,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:55:35,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +31: [2023-05-10 12:55:35,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +31: [2023-05-10 12:55:35,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +31: [2023-05-10 12:55:35,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +27: [2023-05-10 12:55:35,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_00-model_states.pt. +27: [2023-05-10 12:55:35,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +31: [2023-05-10 12:55:35,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:35,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +19: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +21: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +21: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +21: [2023-05-10 12:55:35,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +20: [2023-05-10 12:55:35,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +20: [2023-05-10 12:55:35,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 5: [2023-05-10 12:55:35,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +20: [2023-05-10 12:55:35,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:35,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +21: [2023-05-10 12:55:35,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +19: [2023-05-10 12:55:35,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +19: [2023-05-10 12:55:35,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:55:35,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:55:35,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:55:35,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +14: [2023-05-10 12:55:35,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +19: [2023-05-10 12:55:35,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +21: [2023-05-10 12:55:35,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +21: [2023-05-10 12:55:35,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +21: [2023-05-10 12:55:35,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +14: [2023-05-10 12:55:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +14: [2023-05-10 12:55:35,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +14: [2023-05-10 12:55:35,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +25: [2023-05-10 12:55:35,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:55:35,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:55:35,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +25: [2023-05-10 12:55:35,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +25: [2023-05-10 12:55:35,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +25: [2023-05-10 12:55:35,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +11: [2023-05-10 12:55:35,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:55:35,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:55:35,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:55:35,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +29: [2023-05-10 12:55:35,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +11: [2023-05-10 12:55:35,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:35,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +11: [2023-05-10 12:55:35,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:55:35,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +15: [2023-05-10 12:55:35,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +11: [2023-05-10 12:55:35,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:55:35,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:55:35,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +11: [2023-05-10 12:55:35,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +15: [2023-05-10 12:55:35,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +15: [2023-05-10 12:55:35,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +15: [2023-05-10 12:55:35,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +28: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +17: [2023-05-10 12:55:35,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:55:35,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +17: [2023-05-10 12:55:35,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +17: [2023-05-10 12:55:35,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +30: [2023-05-10 12:55:35,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +17: [2023-05-10 12:55:35,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +26: [2023-05-10 12:55:35,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +26: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:55:35,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:55:35,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +26: [2023-05-10 12:55:35,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +23: [2023-05-10 12:55:35,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:55:35,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:55:35,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:55:35,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +12: [2023-05-10 12:55:35,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +26: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +30: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +24: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +18: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +13: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +29: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +28: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +23: [2023-05-10 12:55:35,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +16: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_28-model_01-model_states.pt. +22: [2023-05-10 12:55:35,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +12: [2023-05-10 12:55:35,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +22: [2023-05-10 12:55:35,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +24: [2023-05-10 12:55:35,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +18: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +16: [2023-05-10 12:55:35,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +30: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +30: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +13: [2023-05-10 12:55:35,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... +28: [2023-05-10 12:55:35,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:55:35,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +24: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +23: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:55:35,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 6: [2023-05-10 12:55:35,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +13: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +13: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +10: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +18: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +10: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +22: [2023-05-10 12:55:35,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 0: [2023-05-10 12:55:35,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +24: [2023-05-10 12:55:35,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +29: [2023-05-10 12:55:35,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +12: [2023-05-10 12:55:35,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +18: [2023-05-10 12:55:35,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +12: [2023-05-10 12:55:35,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:55:35,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:35,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +23: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +28: [2023-05-10 12:55:35,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +16: [2023-05-10 12:55:35,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:35,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 4: [2023-05-10 12:55:35,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +22: [2023-05-10 12:55:35,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. +29: [2023-05-10 12:55:35,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:35,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:35,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +16: [2023-05-10 12:55:35,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... +10: [2023-05-10 12:55:35,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:35,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:35,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:35,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:35,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 5: [2023-05-10 12:55:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt... + 8: [2023-05-10 12:55:35,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:35,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:35,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:35,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:35,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:35,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:55:35,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:35,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:35,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +20: [2023-05-10 12:55:35,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 5: [2023-05-10 12:55:35,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:55:35,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:55:35,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:55:35,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:35,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:35,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:35,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +31: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:35,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +25: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +19: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +25: [2023-05-10 12:55:35,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +19: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +25: [2023-05-10 12:55:35,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:35,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +27: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +27: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 1: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +10: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +21: [2023-05-10 12:55:35,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:35,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +11: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 8: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:35,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:35,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 3: [2023-05-10 12:55:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +10: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +19: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 8: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 8: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +27: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +21: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +14: [2023-05-10 12:55:35,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:35,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +15: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +20: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +20: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:55:35,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +31: [2023-05-10 12:55:35,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:35,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +20: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:35,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +31: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +19: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:55:35,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +31: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +14: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +14: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:35,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:55:35,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +15: [2023-05-10 12:55:35,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +10: [2023-05-10 12:55:35,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +10: [2023-05-10 12:55:35,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:35,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +21: [2023-05-10 12:55:35,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +21: [2023-05-10 12:55:35,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:35,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 3: [2023-05-10 12:55:35,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:35,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 1: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 1: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:55:35,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:35,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:35,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:55:35,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +27: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +14: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +27: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +11: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:35,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:35,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +11: [2023-05-10 12:55:35,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:35,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:35,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:55:35,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:35,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:35,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:35,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:35,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +11: [2023-05-10 12:55:35,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:35,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:35,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +15: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +15: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:35,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +24: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +24: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +24: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 7: [2023-05-10 12:55:35,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 3: [2023-05-10 12:55:35,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:35,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:35,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 7: [2023-05-10 12:55:35,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 7: [2023-05-10 12:55:35,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:35,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:35,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +30: [2023-05-10 12:55:35,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:35,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:55:35,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +30: [2023-05-10 12:55:35,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +30: [2023-05-10 12:55:35,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:35,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:35,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +30: [2023-05-10 12:55:35,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:55:35,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:55:35,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:35,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:35,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:35,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:35,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:55:35,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:35,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +24: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:35,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +16: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +24: [2023-05-10 12:55:35,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:35,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:35,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:35,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +26: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 2: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 2: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +26: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +24: [2023-05-10 12:55:35,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +24: [2023-05-10 12:55:35,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:35,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:35,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:35,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:35,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:35,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +16: [2023-05-10 12:55:35,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:35,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:35,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +18: [2023-05-10 12:55:35,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:55:35,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:35,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:35,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:35,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:35,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:35,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:35,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:35,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:35,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:36,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:36,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:36,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:36,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +29: [2023-05-10 12:55:36,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +16: [2023-05-10 12:55:36,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:55:36,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:36,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:36,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:36,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +16: [2023-05-10 12:55:36,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +26: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +18: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +17: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +17: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +17: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +26: [2023-05-10 12:55:36,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:36,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:36,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:36,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +17: [2023-05-10 12:55:36,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:36,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +18: [2023-05-10 12:55:36,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +16: [2023-05-10 12:55:36,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +18: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +23: [2023-05-10 12:55:36,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +29: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +29: [2023-05-10 12:55:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +29: [2023-05-10 12:55:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +29: [2023-05-10 12:55:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +29: [2023-05-10 12:55:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:55:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:36,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:36,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +13: [2023-05-10 12:55:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +16: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:55:36,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:55:36,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +12: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:36,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +17: [2023-05-10 12:55:36,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +17: [2023-05-10 12:55:36,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +17: [2023-05-10 12:55:36,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:36,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +13: [2023-05-10 12:55:36,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:36,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:36,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:36,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +12: [2023-05-10 12:55:36,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:36,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +28: [2023-05-10 12:55:36,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +23: [2023-05-10 12:55:36,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:55:36,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:36,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +23: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:36,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +23: [2023-05-10 12:55:36,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:36,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:36,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:55:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:55:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:55:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +22: [2023-05-10 12:55:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_29-model_01-model_states.pt. +28: [2023-05-10 12:55:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +12: [2023-05-10 12:55:36,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +13: [2023-05-10 12:55:36,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +28: [2023-05-10 12:55:36,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +28: [2023-05-10 12:55:36,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +12: [2023-05-10 12:55:36,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +13: [2023-05-10 12:55:36,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... +22: [2023-05-10 12:55:36,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:36,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:36,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:36,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. +22: [2023-05-10 12:55:36,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +22: [2023-05-10 12:55:36,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt... +25: [2023-05-10 12:55:36,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +25: [2023-05-10 12:55:36,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:55:36,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:55:36,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:55:36,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:55:36,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:55:36,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:55:36,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +27: [2023-05-10 12:55:36,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:55:36,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:55:36,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:55:36,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:55:36,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:55:36,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:55:36,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +21: [2023-05-10 12:55:36,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:55:36,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +11: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +19: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +18: [2023-05-10 12:55:36,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +31: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +31: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +21: [2023-05-10 12:55:36,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:55:36,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +20: [2023-05-10 12:55:36,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +20: [2023-05-10 12:55:36,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +20: [2023-05-10 12:55:36,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +21: [2023-05-10 12:55:36,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +11: [2023-05-10 12:55:36,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +12: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +31: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +21: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:55:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +10: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +15: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:55:36,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +14: [2023-05-10 12:55:36,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:55:36,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +20: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +16: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +31: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +14: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +14: [2023-05-10 12:55:36,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +14: [2023-05-10 12:55:36,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:55:36,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +29: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +28: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +20: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +20: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:55:36,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +10: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +29: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +10: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +10: [2023-05-10 12:55:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +19: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +15: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +19: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +24: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +30: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +30: [2023-05-10 12:55:36,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +15: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +15: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +30: [2023-05-10 12:55:36,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +23: [2023-05-10 12:55:36,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +24: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +24: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +13: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +30: [2023-05-10 12:55:36,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +13: [2023-05-10 12:55:36,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +23: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:55:36,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +12: [2023-05-10 12:55:36,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:36,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +19: [2023-05-10 12:55:36,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +13: [2023-05-10 12:55:36,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +19: [2023-05-10 12:55:36,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +24: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +23: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +13: [2023-05-10 12:55:36,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +28: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +26: [2023-05-10 12:55:36,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +12: [2023-05-10 12:55:36,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +12: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +18: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +23: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:55:36,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +17: [2023-05-10 12:55:36,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +23: [2023-05-10 12:55:36,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +23: [2023-05-10 12:55:36,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +26: [2023-05-10 12:55:36,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:55:36,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +22: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. +25: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +18: [2023-05-10 12:55:36,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +28: [2023-05-10 12:55:36,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +26: [2023-05-10 12:55:36,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +25: [2023-05-10 12:55:36,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +26: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_30-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +22: [2023-05-10 12:55:36,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +27: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +27: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +27: [2023-05-10 12:55:36,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +29: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +17: [2023-05-10 12:55:36,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +29: [2023-05-10 12:55:36,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +29: [2023-05-10 12:55:36,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +28: [2023-05-10 12:55:36,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +29: [2023-05-10 12:55:36,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:55:36,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +11: [2023-05-10 12:55:36,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:55:36,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +22: [2023-05-10 12:55:36,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +22: [2023-05-10 12:55:36,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +11: [2023-05-10 12:55:36,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +29: [2023-05-10 12:55:36,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt... +16: [2023-05-10 12:55:36,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt... +17: [2023-05-10 12:55:36,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +25: [2023-05-10 12:55:36,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +17: [2023-05-10 12:55:36,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +25: [2023-05-10 12:55:36,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_00-model_states.pt. +16: [2023-05-10 12:55:36,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:55:36,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +31: [2023-05-10 12:55:36,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +11: [2023-05-10 12:55:36,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:36,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:36,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:36,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:36,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +31: [2023-05-10 12:55:36,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 9: [2023-05-10 12:55:36,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:55:36,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +31: [2023-05-10 12:55:36,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 5: [2023-05-10 12:55:36,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:55:36,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +20: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:55:36,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:55:36,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:55:36,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:55:36,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:55:36,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:55:36,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +10: [2023-05-10 12:55:36,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:55:36,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +10: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +10: [2023-05-10 12:55:36,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:55:36,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +21: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:55:36,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:55:36,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:55:36,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +25: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +21: [2023-05-10 12:55:36,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +24: [2023-05-10 12:55:36,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:36,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +24: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:55:36,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +30: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:55:36,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +24: [2023-05-10 12:55:36,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 1: [2023-05-10 12:55:36,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +21: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +21: [2023-05-10 12:55:36,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +24: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +19: [2023-05-10 12:55:36,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:55:36,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +18: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +30: [2023-05-10 12:55:36,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +30: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:36,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +18: [2023-05-10 12:55:36,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +18: [2023-05-10 12:55:36,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 1: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +12: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +18: [2023-05-10 12:55:36,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:36,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 6: [2023-05-10 12:55:36,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +15: [2023-05-10 12:55:36,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +26: [2023-05-10 12:55:36,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +12: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:55:36,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +15: [2023-05-10 12:55:36,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:36,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 6: [2023-05-10 12:55:36,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +11: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:36,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:36,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:36,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +17: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +29: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:36,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +11: [2023-05-10 12:55:36,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:36,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:36,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:36,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +15: [2023-05-10 12:55:36,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:36,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:36,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:36,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +28: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +17: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +27: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:36,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +17: [2023-05-10 12:55:36,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 6: [2023-05-10 12:55:36,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +15: [2023-05-10 12:55:36,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +11: [2023-05-10 12:55:36,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:36,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +29: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +27: [2023-05-10 12:55:36,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +13: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +29: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +29: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +28: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +27: [2023-05-10 12:55:36,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:36,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +27: [2023-05-10 12:55:36,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:36,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +11: [2023-05-10 12:55:36,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:36,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 0: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +22: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +26: [2023-05-10 12:55:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:36,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +28: [2023-05-10 12:55:36,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:36,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:55:36,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +13: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +13: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +19: [2023-05-10 12:55:36,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +23: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +26: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +20: [2023-05-10 12:55:36,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +23: [2023-05-10 12:55:36,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:36,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +28: [2023-05-10 12:55:36,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +19: [2023-05-10 12:55:36,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:55:36,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +26: [2023-05-10 12:55:36,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +26: [2023-05-10 12:55:36,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +14: [2023-05-10 12:55:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:55:36,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 9: [2023-05-10 12:55:36,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:55:36,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +16: [2023-05-10 12:55:36,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. + 2: [2023-05-10 12:55:36,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_31-model_01-model_states.pt. +19: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +20: [2023-05-10 12:55:36,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +13: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 4: [2023-05-10 12:55:36,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:36,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +23: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +22: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:36,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +25: [2023-05-10 12:55:36,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:36,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:55:36,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:55:36,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... + 4: [2023-05-10 12:55:36,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +19: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +16: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +20: [2023-05-10 12:55:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +14: [2023-05-10 12:55:36,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt... +22: [2023-05-10 12:55:36,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +22: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 4: [2023-05-10 12:55:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +31: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +31: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +23: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:36,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:36,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +20: [2023-05-10 12:55:36,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... + 2: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +10: [2023-05-10 12:55:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +20: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +23: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +14: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:55:36,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +12: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +19: [2023-05-10 12:55:36,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +31: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +12: [2023-05-10 12:55:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +14: [2023-05-10 12:55:36,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +19: [2023-05-10 12:55:36,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +19: [2023-05-10 12:55:36,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +16: [2023-05-10 12:55:36,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +10: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:36,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:36,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +10: [2023-05-10 12:55:36,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:55:36,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +25: [2023-05-10 12:55:36,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 3: [2023-05-10 12:55:36,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:55:36,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_00-model_states.pt. +16: [2023-05-10 12:55:36,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt... +25: [2023-05-10 12:55:36,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +10: [2023-05-10 12:55:36,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:36,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:36,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:36,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:36,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:55:36,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:36,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:36,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +11: [2023-05-10 12:55:36,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:55:36,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 8: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:36,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:36,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:36,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:36,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:36,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +31: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:36,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +31: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:36,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:36,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:36,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:36,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:36,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:36,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:36,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 5: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:36,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:36,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:36,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:36,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:36,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +18: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:36,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:36,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +10: [2023-05-10 12:55:36,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:36,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:36,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:36,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:36,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:36,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:36,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:36,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:55:36,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:36,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 7: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:36,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +24: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:36,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:36,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +10: [2023-05-10 12:55:36,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +10: [2023-05-10 12:55:36,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:55:36,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:36,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +18: [2023-05-10 12:55:36,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:36,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:36,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:36,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 0: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:36,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +21: [2023-05-10 12:55:37,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:37,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +21: [2023-05-10 12:55:37,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:37,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +21: [2023-05-10 12:55:37,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +24: [2023-05-10 12:55:37,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:37,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +24: [2023-05-10 12:55:37,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:37,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:37,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:37,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:37,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:37,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:37,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:37,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:37,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:37,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:37,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:37,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:37,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:37,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +25: [2023-05-10 12:55:37,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:37,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:37,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:37,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +25: [2023-05-10 12:55:37,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:37,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:37,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:37,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +15: [2023-05-10 12:55:37,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:37,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:37,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:37,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +12: [2023-05-10 12:55:37,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +28: [2023-05-10 12:55:37,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +25: [2023-05-10 12:55:37,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:37,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:37,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:37,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:37,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:55:37,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:37,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:37,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:37,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:37,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +12: [2023-05-10 12:55:37,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:55:37,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:55:37,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:37,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:37,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +22: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:55:37,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +17: [2023-05-10 12:55:37,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +15: [2023-05-10 12:55:37,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +15: [2023-05-10 12:55:37,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:37,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:37,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:37,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +17: [2023-05-10 12:55:37,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:37,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +30: [2023-05-10 12:55:37,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +17: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +23: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +23: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:37,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:55:37,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +28: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:37,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:37,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:37,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:37,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +15: [2023-05-10 12:55:37,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:37,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:37,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:37,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +26: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +30: [2023-05-10 12:55:37,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:55:37,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:37,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:37,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +28: [2023-05-10 12:55:37,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:37,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:55:37,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +28: [2023-05-10 12:55:37,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +17: [2023-05-10 12:55:37,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +26: [2023-05-10 12:55:37,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:55:37,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +27: [2023-05-10 12:55:37,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +19: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +16: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +30: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:37,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +26: [2023-05-10 12:55:37,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:37,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +13: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +13: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +30: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +22: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:37,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:37,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +27: [2023-05-10 12:55:37,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:37,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:55:37,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +31: [2023-05-10 12:55:37,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +20: [2023-05-10 12:55:37,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +26: [2023-05-10 12:55:37,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:37,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +22: [2023-05-10 12:55:37,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +22: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +19: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +16: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +27: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +23: [2023-05-10 12:55:37,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:37,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:37,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:37,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +27: [2023-05-10 12:55:37,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +11: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +12: [2023-05-10 12:55:37,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +20: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +31: [2023-05-10 12:55:37,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:37,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:37,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:37,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +23: [2023-05-10 12:55:37,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:37,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +29: [2023-05-10 12:55:37,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:37,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +20: [2023-05-10 12:55:37,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +14: [2023-05-10 12:55:37,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +12: [2023-05-10 12:55:37,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:55:37,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +13: [2023-05-10 12:55:37,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_32-model_01-model_states.pt. +29: [2023-05-10 12:55:37,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:37,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +29: [2023-05-10 12:55:37,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:37,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +19: [2023-05-10 12:55:37,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +16: [2023-05-10 12:55:37,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +20: [2023-05-10 12:55:37,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +19: [2023-05-10 12:55:37,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +11: [2023-05-10 12:55:37,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +11: [2023-05-10 12:55:37,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +14: [2023-05-10 12:55:37,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +29: [2023-05-10 12:55:37,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt... +13: [2023-05-10 12:55:37,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +18: [2023-05-10 12:55:37,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +12: [2023-05-10 12:55:37,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +24: [2023-05-10 12:55:37,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +21: [2023-05-10 12:55:37,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +23: [2023-05-10 12:55:37,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:37,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +14: [2023-05-10 12:55:37,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +14: [2023-05-10 12:55:37,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... +18: [2023-05-10 12:55:37,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:55:37,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +10: [2023-05-10 12:55:37,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_00-model_states.pt. +16: [2023-05-10 12:55:37,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +22: [2023-05-10 12:55:37,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:37,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +21: [2023-05-10 12:55:37,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:55:37,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +21: [2023-05-10 12:55:37,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +27: [2023-05-10 12:55:37,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +25: [2023-05-10 12:55:37,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:55:37,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +27: [2023-05-10 12:55:37,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +10: [2023-05-10 12:55:37,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +10: [2023-05-10 12:55:37,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +10: [2023-05-10 12:55:37,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:55:37,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:55:37,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:55:37,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +24: [2023-05-10 12:55:37,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +31: [2023-05-10 12:55:37,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:55:37,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:55:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:55:37,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +10: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:55:37,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +15: [2023-05-10 12:55:37,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +31: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +10: [2023-05-10 12:55:37,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +17: [2023-05-10 12:55:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:55:37,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:55:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +29: [2023-05-10 12:55:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +15: [2023-05-10 12:55:37,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:55:37,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:37,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +20: [2023-05-10 12:55:37,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +20: [2023-05-10 12:55:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +17: [2023-05-10 12:55:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +17: [2023-05-10 12:55:37,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +17: [2023-05-10 12:55:37,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +15: [2023-05-10 12:55:37,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +15: [2023-05-10 12:55:37,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +11: [2023-05-10 12:55:37,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:55:37,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:55:37,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:55:37,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +11: [2023-05-10 12:55:37,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +11: [2023-05-10 12:55:37,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +29: [2023-05-10 12:55:37,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:55:37,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:37,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +20: [2023-05-10 12:55:37,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +21: [2023-05-10 12:55:37,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +27: [2023-05-10 12:55:37,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:55:37,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:37,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +10: [2023-05-10 12:55:37,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:37,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:37,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:37,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +21: [2023-05-10 12:55:37,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:37,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +25: [2023-05-10 12:55:37,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +23: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +12: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:55:37,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +16: [2023-05-10 12:55:37,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +27: [2023-05-10 12:55:37,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:55:37,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:55:37,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:55:37,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:37,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:55:37,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:55:37,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +23: [2023-05-10 12:55:37,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:55:37,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:37,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +23: [2023-05-10 12:55:37,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +23: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:37,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +16: [2023-05-10 12:55:37,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +31: [2023-05-10 12:55:37,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:55:37,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:55:37,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:55:37,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +28: [2023-05-10 12:55:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +28: [2023-05-10 12:55:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +26: [2023-05-10 12:55:37,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +31: [2023-05-10 12:55:37,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +24: [2023-05-10 12:55:37,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +24: [2023-05-10 12:55:37,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +30: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +26: [2023-05-10 12:55:37,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +11: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +28: [2023-05-10 12:55:37,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +30: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +16: [2023-05-10 12:55:37,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +13: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +22: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +22: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +22: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +19: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +12: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +18: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:37,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +18: [2023-05-10 12:55:37,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +28: [2023-05-10 12:55:37,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +29: [2023-05-10 12:55:37,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:37,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +18: [2023-05-10 12:55:37,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +26: [2023-05-10 12:55:37,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +16: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +22: [2023-05-10 12:55:37,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +11: [2023-05-10 12:55:37,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:37,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +29: [2023-05-10 12:55:37,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +19: [2023-05-10 12:55:37,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +28: [2023-05-10 12:55:37,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:55:37,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +13: [2023-05-10 12:55:37,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +11: [2023-05-10 12:55:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:55:37,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:37,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:37,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +28: [2023-05-10 12:55:37,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +20: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +22: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +30: [2023-05-10 12:55:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +30: [2023-05-10 12:55:37,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +26: [2023-05-10 12:55:37,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +12: [2023-05-10 12:55:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:55:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +12: [2023-05-10 12:55:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +22: [2023-05-10 12:55:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +13: [2023-05-10 12:55:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +19: [2023-05-10 12:55:37,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +19: [2023-05-10 12:55:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +20: [2023-05-10 12:55:37,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +18: [2023-05-10 12:55:37,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +13: [2023-05-10 12:55:37,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +18: [2023-05-10 12:55:37,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +18: [2023-05-10 12:55:37,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +18: [2023-05-10 12:55:37,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +21: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +27: [2023-05-10 12:55:37,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +21: [2023-05-10 12:55:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +21: [2023-05-10 12:55:37,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +21: [2023-05-10 12:55:37,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +21: [2023-05-10 12:55:37,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:55:37,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:55:37,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:55:37,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_33-model_01-model_states.pt. +14: [2023-05-10 12:55:37,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +14: [2023-05-10 12:55:37,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:55:37,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +25: [2023-05-10 12:55:37,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt... +25: [2023-05-10 12:55:37,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +21: [2023-05-10 12:55:37,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +21: [2023-05-10 12:55:37,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:55:37,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +14: [2023-05-10 12:55:37,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +24: [2023-05-10 12:55:37,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_00-model_states.pt. +14: [2023-05-10 12:55:37,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt... +25: [2023-05-10 12:55:37,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:55:37,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:55:37,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +24: [2023-05-10 12:55:37,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +25: [2023-05-10 12:55:37,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +25: [2023-05-10 12:55:37,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:55:37,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +24: [2023-05-10 12:55:37,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:55:37,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:55:37,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:55:37,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +24: [2023-05-10 12:55:37,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +24: [2023-05-10 12:55:37,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +28: [2023-05-10 12:55:37,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:55:37,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:37,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:37,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:37,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:37,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:37,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +26: [2023-05-10 12:55:37,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:37,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:37,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:37,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:37,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:37,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:37,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:37,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:55:37,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:37,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:37,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +15: [2023-05-10 12:55:37,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +26: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +17: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:55:37,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +26: [2023-05-10 12:55:37,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +26: [2023-05-10 12:55:37,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:55:37,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 7: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:55:37,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:37,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:37,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:37,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:37,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:37,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +15: [2023-05-10 12:55:37,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +31: [2023-05-10 12:55:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +31: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 0: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 0: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:55:37,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +15: [2023-05-10 12:55:37,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:37,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:37,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:55:37,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:55:37,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt... + 3: [2023-05-10 12:55:37,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:37,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:55:37,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:55:37,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:55:37,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:37,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:55:37,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:55:37,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt... + 7: [2023-05-10 12:55:37,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:55:37,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:55:37,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:55:37,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt... + 5: [2023-05-10 12:55:37,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:55:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +27: [2023-05-10 12:55:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:37,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:37,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:37,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:37,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt... +17: [2023-05-10 12:55:37,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:37,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:37,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:37,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:37,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +31: [2023-05-10 12:55:37,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:37,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +27: [2023-05-10 12:55:37,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +17: [2023-05-10 12:55:37,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +30: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +10: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +20: [2023-05-10 12:55:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +20: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +16: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 1: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +23: [2023-05-10 12:55:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +19: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +17: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +20: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 2: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +13: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +12: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +11: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +12: [2023-05-10 12:55:37,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +12: [2023-05-10 12:55:37,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +30: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +20: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +15: [2023-05-10 12:55:37,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt... +10: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +22: [2023-05-10 12:55:37,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +13: [2023-05-10 12:55:37,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +28: [2023-05-10 12:55:37,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +14: [2023-05-10 12:55:37,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +22: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt... +27: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +27: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +16: [2023-05-10 12:55:37,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:55:37,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. +29: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_34-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +23: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +20: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +19: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +14: [2023-05-10 12:55:37,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +11: [2023-05-10 12:55:37,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +10: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:37,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:55:37,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +16: [2023-05-10 12:55:37,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +10: [2023-05-10 12:55:37,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +16: [2023-05-10 12:55:37,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +10: [2023-05-10 12:55:37,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:55:37,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +29: [2023-05-10 12:55:37,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +23: [2023-05-10 12:55:37,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +23: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt... +23: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +13: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +13: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +11: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +11: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +19: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +30: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +30: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:37,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +19: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt... +14: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +28: [2023-05-10 12:55:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +28: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:55:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +22: [2023-05-10 12:55:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +14: [2023-05-10 12:55:37,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +22: [2023-05-10 12:55:37,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 6: [2023-05-10 12:55:37,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +20: [2023-05-10 12:55:37,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +29: [2023-05-10 12:55:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +31: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +31: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +25: [2023-05-10 12:55:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +23: [2023-05-10 12:55:37,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:37,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +14: [2023-05-10 12:55:37,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:37,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 9: [2023-05-10 12:55:37,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 3: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:37,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:37,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:37,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt... + 6: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt... + 8: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:37,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:37,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:37,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:37,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +27: [2023-05-10 12:55:37,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:37,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:37,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:37,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_00-model_states.pt. +18: [2023-05-10 12:55:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt... +29: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:37,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt... +28: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:37,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:37,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:37,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:37,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:37,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:37,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:37,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: > overriding learning rate value to 0.0002 +19: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: > overriding minimum learning rate value to 2e-05 + 0: > overriding warmup iterations value to 0 + 0: > overriding total number of iterations value to 1 + 0: > overriding decay style value to cosine + 0: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:37,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:37,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:37,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:37,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:37,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:55:37,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:37,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:37,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:37,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:37,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:37,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:37,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:37,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:37,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:37,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:37,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:37,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:37,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:37,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:37,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +27: [2023-05-10 12:55:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 8: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:37,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:37,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:37,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:55:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:55:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt... +23: [2023-05-10 12:55:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt... +29: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:37,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:55:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:55:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:37,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +25: [2023-05-10 12:55:37,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:55:37,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:55:37,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:55:37,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:37,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt... +16: [2023-05-10 12:55:37,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:37,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:37,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt... +31: [2023-05-10 12:55:37,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:37,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:37,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:37,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt... +20: [2023-05-10 12:55:37,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:55:37,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:55:37,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:55:37,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt... + 9: [2023-05-10 12:55:37,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:55:37,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +15: [2023-05-10 12:55:37,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +18: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt... + 0: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:55:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt... + 1: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +18: [2023-05-10 12:55:37,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:37,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt... +26: [2023-05-10 12:55:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt... +12: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt... +12: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:37,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt... + 4: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt... + 4: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt... + 4: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt... +13: [2023-05-10 12:55:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:37,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:37,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:37,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt... +19: [2023-05-10 12:55:37,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:37,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:37,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:37,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt... +18: [2023-05-10 12:55:37,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:55:37,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:55:37,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:55:37,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt... + 2: [2023-05-10 12:55:37,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +25: [2023-05-10 12:55:37,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:37,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:37,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +15: [2023-05-10 12:55:37,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:37,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:55:37,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:55:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt... +30: [2023-05-10 12:55:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt... +11: [2023-05-10 12:55:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt... +24: [2023-05-10 12:55:37,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:55:37,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:55:37,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:55:37,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +21: [2023-05-10 12:55:37,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:37,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:37,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:55:37,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:37,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:55:37,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:55:37,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt... +21: [2023-05-10 12:55:37,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt... +25: [2023-05-10 12:55:37,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:37,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:37,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:37,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:37,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:37,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:37,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:37,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:37,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:37,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt... +22: [2023-05-10 12:55:37,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt... +15: [2023-05-10 12:55:37,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 5: [2023-05-10 12:55:37,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +24: [2023-05-10 12:55:37,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +21: [2023-05-10 12:55:37,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:37,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:37,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:37,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:37,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 5: [2023-05-10 12:55:37,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +24: [2023-05-10 12:55:37,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:37,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:37,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:37,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +24: [2023-05-10 12:55:37,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:37,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:38,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:55:38,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:55:38,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:55:38,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:38,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:38,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:55:38,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:55:38,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +28: [2023-05-10 12:55:38,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:38,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:38,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:38,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +26: [2023-05-10 12:55:38,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:38,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:38,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:55:38,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:55:38,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:55:38,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +26: [2023-05-10 12:55:38,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:38,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:38,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:38,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +17: [2023-05-10 12:55:38,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:38,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +28: [2023-05-10 12:55:38,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +26: [2023-05-10 12:55:38,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +26: [2023-05-10 12:55:38,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:38,071] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 40 + 5: [2023-05-10 12:55:38,075] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 40 + 6: [2023-05-10 12:55:38,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:55:38,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:55:38,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +17: [2023-05-10 12:55:38,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:55:38,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:55:38,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:55:38,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +31: [2023-05-10 12:55:38,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:55:38,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:55:38,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:55:38,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:38,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:38,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:38,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +31: [2023-05-10 12:55:38,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:55:38,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +31: [2023-05-10 12:55:38,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:38,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:38,122] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 138 +31: [2023-05-10 12:55:38,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +31: [2023-05-10 12:55:38,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +17: [2023-05-10 12:55:38,126] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 138 + 2: [2023-05-10 12:55:38,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:38,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:38,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:38,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:38,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:38,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +19: [2023-05-10 12:55:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +19: [2023-05-10 12:55:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +19: [2023-05-10 12:55:38,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +19: [2023-05-10 12:55:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,141] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 26 +19: [2023-05-10 12:55:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +20: [2023-05-10 12:55:38,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +20: [2023-05-10 12:55:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,146] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 26 + 0: [2023-05-10 12:55:38,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 7: [2023-05-10 12:55:38,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:55:38,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,153] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 56 + 4: [2023-05-10 12:55:38,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,157] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 56 +20: [2023-05-10 12:55:38,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:38,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:55:38,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:38,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +20: [2023-05-10 12:55:38,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +20: [2023-05-10 12:55:38,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:55:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:55:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:55:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +27: [2023-05-10 12:55:38,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +10: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:38,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:38,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:38,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:38,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +23: [2023-05-10 12:55:38,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +29: [2023-05-10 12:55:38,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:38,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:38,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:38,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:38,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:38,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +30: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +12: [2023-05-10 12:55:38,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +16: [2023-05-10 12:55:38,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:38,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +27: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +27: [2023-05-10 12:55:38,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +27: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:55:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +14: [2023-05-10 12:55:38,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 3: [2023-05-10 12:55:38,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:38,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:38,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +10: [2023-05-10 12:55:38,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +23: [2023-05-10 12:55:38,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +27: [2023-05-10 12:55:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:55:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:55:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +27: [2023-05-10 12:55:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:38,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +16: [2023-05-10 12:55:38,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:38,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:38,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:38,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:55:38,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +22: [2023-05-10 12:55:38,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:55:38,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:38,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +13: [2023-05-10 12:55:38,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +29: [2023-05-10 12:55:38,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +29: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:55:38,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:38,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:38,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:38,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +13: [2023-05-10 12:55:38,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... + 3: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +27: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +29: [2023-05-10 12:55:38,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +14: [2023-05-10 12:55:38,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +14: [2023-05-10 12:55:38,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +30: [2023-05-10 12:55:38,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:38,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:38,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +30: [2023-05-10 12:55:38,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:55:38,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +30: [2023-05-10 12:55:38,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:55:38,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +25: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +16: [2023-05-10 12:55:38,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +18: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +16: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +23: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +18: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +22: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +12: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +12: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:38,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +14: [2023-05-10 12:55:38,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +12: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +10: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +10: [2023-05-10 12:55:38,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:38,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 5: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +21: [2023-05-10 12:55:38,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +21: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +21: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +21: [2023-05-10 12:55:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +25: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +18: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 5: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 5: [2023-05-10 12:55:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:55:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:38,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +24: [2023-05-10 12:55:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:38,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +25: [2023-05-10 12:55:38,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +25: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:38,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +18: [2023-05-10 12:55:38,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:38,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +24: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +18: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +24: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +24: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +25: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +25: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +15: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +15: [2023-05-10 12:55:38,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +18: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +18: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +18: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +16: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +24: [2023-05-10 12:55:38,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:38,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +15: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +15: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +15: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +15: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 7: [2023-05-10 12:55:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +24: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +24: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:55:38,225] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 60 +24: [2023-05-10 12:55:38,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,225] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 52 +13: [2023-05-10 12:55:38,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +13: [2023-05-10 12:55:38,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +22: [2023-05-10 12:55:38,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +22: [2023-05-10 12:55:38,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +13: [2023-05-10 12:55:38,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,229] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 60 + 6: [2023-05-10 12:55:38,229] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 52 +13: [2023-05-10 12:55:38,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:38,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:55:38,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +11: [2023-05-10 12:55:38,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:55:38,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:38,233] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 142 +11: [2023-05-10 12:55:38,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_35-model_01-model_states.pt. +17: [2023-05-10 12:55:38,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:38,236] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 136 +27: [2023-05-10 12:55:38,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:55:38,238] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 222 +17: [2023-05-10 12:55:38,238] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 142 +28: [2023-05-10 12:55:38,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:38,239] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 226 +17: [2023-05-10 12:55:38,240] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 136 +28: [2023-05-10 12:55:38,243] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 226 +27: [2023-05-10 12:55:38,243] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 222 + 3: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt... + 3: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +28: [2023-05-10 12:55:38,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +28: [2023-05-10 12:55:38,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +28: [2023-05-10 12:55:38,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +28: [2023-05-10 12:55:38,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +15: [2023-05-10 12:55:38,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:55:38,248] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 122 +16: [2023-05-10 12:55:38,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:55:38,249] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 132 +11: [2023-05-10 12:55:38,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:38,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +11: [2023-05-10 12:55:38,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt... +23: [2023-05-10 12:55:38,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:55:38,251] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 190 +27: [2023-05-10 12:55:38,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,253] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 122 + 5: [2023-05-10 12:55:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:55:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:55:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt... + 5: [2023-05-10 12:55:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:55:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,255] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 132 +23: [2023-05-10 12:55:38,255] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 190 + 8: [2023-05-10 12:55:38,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:55:38,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:55:38,256] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 64 +10: [2023-05-10 12:55:38,256] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 80 +28: [2023-05-10 12:55:38,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:38,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:38,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +28: [2023-05-10 12:55:38,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +28: [2023-05-10 12:55:38,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:55:38,257] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 82 +18: [2023-05-10 12:55:38,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,260] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 64 +10: [2023-05-10 12:55:38,260] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 80 +11: [2023-05-10 12:55:38,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +28: [2023-05-10 12:55:38,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:55:38,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:55:38,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:55:38,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:55:38,261] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 82 +29: [2023-05-10 12:55:38,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:38,262] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 232 +31: [2023-05-10 12:55:38,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:38,264] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 254 +29: [2023-05-10 12:55:38,266] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 232 +21: [2023-05-10 12:55:38,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:55:38,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:55:38,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:55:38,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt... +25: [2023-05-10 12:55:38,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:55:38,269] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 216 +31: [2023-05-10 12:55:38,269] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 254 +26: [2023-05-10 12:55:38,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:55:38,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:55:38,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +26: [2023-05-10 12:55:38,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +27: [2023-05-10 12:55:38,274] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 216 + 6: [2023-05-10 12:55:38,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt. + 6: [2023-05-10 12:55:38,275] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 48 +11: [2023-05-10 12:55:38,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. +11: [2023-05-10 12:55:38,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 7: [2023-05-10 12:55:38,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:55:38,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:55:38,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt... + 7: [2023-05-10 12:55:38,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:55:38,278] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 124 +11: [2023-05-10 12:55:38,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:38,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +11: [2023-05-10 12:55:38,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,279] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 48 +11: [2023-05-10 12:55:38,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt... +15: [2023-05-10 12:55:38,282] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 124 +26: [2023-05-10 12:55:38,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +24: [2023-05-10 12:55:38,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,285] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 106 +26: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +26: [2023-05-10 12:55:38,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +25: [2023-05-10 12:55:38,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:55:38,287] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 200 + 3: [2023-05-10 12:55:38,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:55:38,289] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 24 +26: [2023-05-10 12:55:38,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +26: [2023-05-10 12:55:38,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +26: [2023-05-10 12:55:38,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:38,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,292] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 186 +25: [2023-05-10 12:55:38,292] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 200 +13: [2023-05-10 12:55:38,292] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 106 + 8: [2023-05-10 12:55:38,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +15: [2023-05-10 12:55:38,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt... +15: [2023-05-10 12:55:38,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 3: [2023-05-10 12:55:38,294] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 24 + 8: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 8: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +17: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:55:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:55:38,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,295] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 118 + 8: [2023-05-10 12:55:38,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:55:38,296] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 186 + 8: [2023-05-10 12:55:38,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,299] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 118 + 6: [2023-05-10 12:55:38,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt. + 6: [2023-05-10 12:55:38,300] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 54 +17: [2023-05-10 12:55:38,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:38,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:38,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:38,304] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 160 +17: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +17: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +17: [2023-05-10 12:55:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,305] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 54 +17: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:55:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +17: [2023-05-10 12:55:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:55:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:55:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:55:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:55:38,308] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 160 + 5: [2023-05-10 12:55:38,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:38,313] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 46 + 3: [2023-05-10 12:55:38,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:55:38,314] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 28 + 0: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 3: [2023-05-10 12:55:38,318] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 28 + 7: [2023-05-10 12:55:38,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:38,318] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 46 + 7: [2023-05-10 12:55:38,318] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 58 + 7: [2023-05-10 12:55:38,323] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 58 + 9: [2023-05-10 12:55:38,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:55:38,324] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 76 + 0: [2023-05-10 12:55:38,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +28: [2023-05-10 12:55:38,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt... +28: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 0: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:55:38,329] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 96 + 9: [2023-05-10 12:55:38,329] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 76 +19: [2023-05-10 12:55:38,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:38,329] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 154 + 6: [2023-05-10 12:55:38,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +28: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:38,331] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 230 + 0: [2023-05-10 12:55:38,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,333] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 96 +19: [2023-05-10 12:55:38,334] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 154 +28: [2023-05-10 12:55:38,335] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 230 + 6: [2023-05-10 12:55:38,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 6: [2023-05-10 12:55:38,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:38,343] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 176 + 6: [2023-05-10 12:55:38,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +17: [2023-05-10 12:55:38,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt. +17: [2023-05-10 12:55:38,343] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 140 +17: [2023-05-10 12:55:38,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt... +17: [2023-05-10 12:55:38,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt... +24: [2023-05-10 12:55:38,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:38,347] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 192 +17: [2023-05-10 12:55:38,348] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 140 + 1: [2023-05-10 12:55:38,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +26: [2023-05-10 12:55:38,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:55:38,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +26: [2023-05-10 12:55:38,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt... +26: [2023-05-10 12:55:38,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,349] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 176 +10: [2023-05-10 12:55:38,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:55:38,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:55:38,350] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 84 + 1: [2023-05-10 12:55:38,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt. + 0: [2023-05-10 12:55:38,350] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 2 + 1: [2023-05-10 12:55:38,350] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 8 +20: [2023-05-10 12:55:38,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +20: [2023-05-10 12:55:38,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 1: [2023-05-10 12:55:38,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 8: [2023-05-10 12:55:38,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:55:38,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 8: [2023-05-10 12:55:38,353] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 70 +10: [2023-05-10 12:55:38,354] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 84 +24: [2023-05-10 12:55:38,354] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 192 +28: [2023-05-10 12:55:38,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:55:38,354] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 8 +20: [2023-05-10 12:55:38,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +28: [2023-05-10 12:55:38,354] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 228 +20: [2023-05-10 12:55:38,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,355] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 2 + 1: [2023-05-10 12:55:38,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt. + 1: [2023-05-10 12:55:38,356] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 10 + 8: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 8: [2023-05-10 12:55:38,358] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 70 +13: [2023-05-10 12:55:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:38,359] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 228 +20: [2023-05-10 12:55:38,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:38,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,359] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 108 +15: [2023-05-10 12:55:38,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:55:38,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +15: [2023-05-10 12:55:38,359] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 126 +27: [2023-05-10 12:55:38,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:55:38,360] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 220 + 1: [2023-05-10 12:55:38,360] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 10 + 5: [2023-05-10 12:55:38,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:38,361] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 44 +20: [2023-05-10 12:55:38,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:55:38,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,363] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 108 +15: [2023-05-10 12:55:38,364] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 126 +20: [2023-05-10 12:55:38,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:38,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +20: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 5: [2023-05-10 12:55:38,365] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 44 +20: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 7: [2023-05-10 12:55:38,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt. + 7: [2023-05-10 12:55:38,367] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 62 +20: [2023-05-10 12:55:38,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +20: [2023-05-10 12:55:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +27: [2023-05-10 12:55:38,368] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 220 +13: [2023-05-10 12:55:38,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt. +13: [2023-05-10 12:55:38,370] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 110 +19: [2023-05-10 12:55:38,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:38,370] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 158 +25: [2023-05-10 12:55:38,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:55:38,371] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 202 +18: [2023-05-10 12:55:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:55:38,371] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 146 + 7: [2023-05-10 12:55:38,371] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 62 +19: [2023-05-10 12:55:38,374] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 158 +13: [2023-05-10 12:55:38,375] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 110 +18: [2023-05-10 12:55:38,376] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 146 +25: [2023-05-10 12:55:38,376] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 202 +11: [2023-05-10 12:55:38,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:55:38,378] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 94 +24: [2023-05-10 12:55:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:38,379] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 198 + 0: [2023-05-10 12:55:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:55:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:55:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt... + 0: [2023-05-10 12:55:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:55:38,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:55:38,380] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 72 + 6: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt... + 6: [2023-05-10 12:55:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,382] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 94 +22: [2023-05-10 12:55:38,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:38,383] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 182 +24: [2023-05-10 12:55:38,383] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 198 + 9: [2023-05-10 12:55:38,385] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 72 +14: [2023-05-10 12:55:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:55:38,387] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 112 +22: [2023-05-10 12:55:38,388] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 182 + 8: [2023-05-10 12:55:38,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:55:38,388] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 68 +31: [2023-05-10 12:55:38,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:38,390] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 250 +14: [2023-05-10 12:55:38,391] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 112 + 8: [2023-05-10 12:55:38,392] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 68 +31: [2023-05-10 12:55:38,394] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 250 +26: [2023-05-10 12:55:38,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:38,396] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 210 +16: [2023-05-10 12:55:38,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:55:38,398] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 134 +16: [2023-05-10 12:55:38,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt. +16: [2023-05-10 12:55:38,400] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 128 +26: [2023-05-10 12:55:38,401] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 210 +16: [2023-05-10 12:55:38,402] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 134 + 1: [2023-05-10 12:55:38,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt... + 1: [2023-05-10 12:55:38,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:55:38,404] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 128 +18: [2023-05-10 12:55:38,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:55:38,405] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 148 +28: [2023-05-10 12:55:38,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:38,405] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 224 +20: [2023-05-10 12:55:38,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:55:38,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:55:38,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt... +20: [2023-05-10 12:55:38,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt... + 8: [2023-05-10 12:55:38,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt. + 8: [2023-05-10 12:55:38,407] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 66 +18: [2023-05-10 12:55:38,409] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 148 +28: [2023-05-10 12:55:38,410] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 224 + 8: [2023-05-10 12:55:38,411] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 66 +12: [2023-05-10 12:55:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:55:38,413] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 100 + 9: [2023-05-10 12:55:38,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:55:38,412] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 74 +24: [2023-05-10 12:55:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:38,414] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 196 + 9: [2023-05-10 12:55:38,416] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 74 + 4: [2023-05-10 12:55:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:38,416] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 34 +12: [2023-05-10 12:55:38,417] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 100 +31: [2023-05-10 12:55:38,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:38,418] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 248 +24: [2023-05-10 12:55:38,419] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 196 + 4: [2023-05-10 12:55:38,421] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 34 +15: [2023-05-10 12:55:38,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:55:38,421] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 120 +23: [2023-05-10 12:55:38,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:38,424] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 248 +23: [2023-05-10 12:55:38,423] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 184 +30: [2023-05-10 12:55:38,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:38,424] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 240 +22: [2023-05-10 12:55:38,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt. +15: [2023-05-10 12:55:38,426] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 120 +22: [2023-05-10 12:55:38,426] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 178 +23: [2023-05-10 12:55:38,427] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 184 +31: [2023-05-10 12:55:38,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:55:38,428] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 240 + 9: [2023-05-10 12:55:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,430] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 178 +14: [2023-05-10 12:55:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:55:38,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:55:38,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:55:38,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:55:38,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:38,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:55:38,433] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 104 + 2: [2023-05-10 12:55:38,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:55:38,434] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 170 + 2: [2023-05-10 12:55:38,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:38,437] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 22 +10: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,437] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 104 +23: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:38,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:38,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:38,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +21: [2023-05-10 12:55:38,438] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 170 +31: [2023-05-10 12:55:38,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +31: [2023-05-10 12:55:38,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,440] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 38 +29: [2023-05-10 12:55:38,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:55:38,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +31: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +31: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +31: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +31: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,442] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 22 +19: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +14: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt. + 9: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 9: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,443] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 130 + 9: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 9: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 2: [2023-05-10 12:55:38,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:38,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 6: [2023-05-10 12:55:38,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +31: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 6: [2023-05-10 12:55:38,445] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 50 +21: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +19: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 2: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +19: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,445] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 14 +19: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +21: [2023-05-10 12:55:38,445] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 174 +20: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +13: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,445] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 38 + 4: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +22: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +31: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +20: [2023-05-10 12:55:38,445] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 162 +19: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +14: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +14: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +14: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +14: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +19: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +19: [2023-05-10 12:55:38,446] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 156 +19: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,447] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 130 +23: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +23: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +23: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,447] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 0 +23: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +23: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +12: [2023-05-10 12:55:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:55:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:38,448] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 234 +16: [2023-05-10 12:55:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 6: [2023-05-10 12:55:38,450] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 50 +13: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 1: [2023-05-10 12:55:38,450] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 14 +23: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +20: [2023-05-10 12:55:38,450] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 162 +13: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +10: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +19: [2023-05-10 12:55:38,450] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 156 +29: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +10: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +23: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +23: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +10: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +10: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:55:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +16: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +10: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 2: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 1: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +21: [2023-05-10 12:55:38,451] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 174 + 1: [2023-05-10 12:55:38,451] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 12 +23: [2023-05-10 12:55:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 0: [2023-05-10 12:55:38,452] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 0 +29: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +30: [2023-05-10 12:55:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +29: [2023-05-10 12:55:38,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:38,453] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 234 +30: [2023-05-10 12:55:38,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. +11: [2023-05-10 12:55:38,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_36-model_01-model_states.pt. + 0: could not find arguments in the checkpoint ... + 0: checkpoint version 3.0 + 2: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 2: [2023-05-10 12:55:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +13: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +13: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +13: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 1: [2023-05-10 12:55:38,456] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 12 + 4: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +13: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +29: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:38,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 9: [2023-05-10 12:55:38,456] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 78 + 4: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. + 4: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:38,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +29: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +29: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +16: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +12: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +12: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +12: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 4: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +22: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 9: [2023-05-10 12:55:38,460] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 78 +11: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +29: [2023-05-10 12:55:38,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:55:38,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:38,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +16: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +16: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +12: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +16: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:38,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... + 4: [2023-05-10 12:55:38,462] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 36 +12: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +22: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +11: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +22: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +22: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 0: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +11: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,464] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 6 +12: [2023-05-10 12:55:38,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:55:38,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:55:38,465] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 102 +14: [2023-05-10 12:55:38,465] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 114 +11: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +30: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt... +11: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +30: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_00-model_states.pt. +11: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +11: [2023-05-10 12:55:38,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. + 4: [2023-05-10 12:55:38,466] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 36 +11: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... +30: [2023-05-10 12:55:38,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt... + 0: [2023-05-10 12:55:38,469] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 6 +12: [2023-05-10 12:55:38,469] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 102 +14: [2023-05-10 12:55:38,470] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 114 +10: [2023-05-10 12:55:38,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt. +10: [2023-05-10 12:55:38,470] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 86 +30: [2023-05-10 12:55:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +30: [2023-05-10 12:55:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/layer_38-model_01-model_states.pt. +26: [2023-05-10 12:55:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:38,474] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 208 +26: [2023-05-10 12:55:38,474] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 214 +10: [2023-05-10 12:55:38,475] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 86 +30: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:38,477] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 242 +21: [2023-05-10 12:55:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:55:38,477] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 168 +29: [2023-05-10 12:55:38,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:38,477] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 238 +30: [2023-05-10 12:55:38,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:38,477] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 246 +26: [2023-05-10 12:55:38,478] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 214 +26: [2023-05-10 12:55:38,478] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 208 + 9: [2023-05-10 12:55:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:55:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:55:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt... + 9: [2023-05-10 12:55:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,481] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 242 +21: [2023-05-10 12:55:38,481] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 168 +29: [2023-05-10 12:55:38,481] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 238 +31: [2023-05-10 12:55:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:55:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:55:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt... +31: [2023-05-10 12:55:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,481] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 246 +19: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:55:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:55:38,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:38,486] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 18 +19: [2023-05-10 12:55:38,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt. +19: [2023-05-10 12:55:38,486] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 152 +14: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt... +14: [2023-05-10 12:55:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt... +13: [2023-05-10 12:55:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt... +19: [2023-05-10 12:55:38,491] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 152 + 2: [2023-05-10 12:55:38,491] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 18 +10: [2023-05-10 12:55:38,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:55:38,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:55:38,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt... +10: [2023-05-10 12:55:38,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt. +21: [2023-05-10 12:55:38,494] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 172 +23: [2023-05-10 12:55:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:55:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:55:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt... +23: [2023-05-10 12:55:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt. +27: [2023-05-10 12:55:38,496] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 218 +16: [2023-05-10 12:55:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:55:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:55:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt... +16: [2023-05-10 12:55:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt... +21: [2023-05-10 12:55:38,498] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 172 +23: [2023-05-10 12:55:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt. +23: [2023-05-10 12:55:38,499] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 188 +31: [2023-05-10 12:55:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt. +31: [2023-05-10 12:55:38,499] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 252 + 4: [2023-05-10 12:55:38,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:55:38,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:55:38,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt... + 4: [2023-05-10 12:55:38,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt... +27: [2023-05-10 12:55:38,500] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 218 +18: [2023-05-10 12:55:38,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:55:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:55:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt... +29: [2023-05-10 12:55:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt... +18: [2023-05-10 12:55:38,503] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 144 +23: [2023-05-10 12:55:38,503] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 188 +31: [2023-05-10 12:55:38,503] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 252 +11: [2023-05-10 12:55:38,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:55:38,507] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 90 +11: [2023-05-10 12:55:38,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:55:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:55:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:55:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt... +12: [2023-05-10 12:55:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,508] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 92 +18: [2023-05-10 12:55:38,508] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 144 +29: [2023-05-10 12:55:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt. +29: [2023-05-10 12:55:38,508] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 236 +22: [2023-05-10 12:55:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt... +22: [2023-05-10 12:55:38,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,512] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 90 +11: [2023-05-10 12:55:38,513] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 92 +29: [2023-05-10 12:55:38,513] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 236 + 2: [2023-05-10 12:55:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:55:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:55:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt... + 2: [2023-05-10 12:55:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt... +11: [2023-05-10 12:55:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt... +30: [2023-05-10 12:55:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt. +30: [2023-05-10 12:55:38,522] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 244 +30: [2023-05-10 12:55:38,529] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 244 + 2: [2023-05-10 12:55:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:38,538] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 16 +12: [2023-05-10 12:55:38,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt. +12: [2023-05-10 12:55:38,539] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 98 + 2: [2023-05-10 12:55:38,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt. + 2: [2023-05-10 12:55:38,540] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 20 +12: [2023-05-10 12:55:38,544] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 98 + 2: [2023-05-10 12:55:38,544] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 16 +26: [2023-05-10 12:55:38,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt. +26: [2023-05-10 12:55:38,546] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 212 + 2: [2023-05-10 12:55:38,547] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 20 + 3: [2023-05-10 12:55:38,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt. + 3: [2023-05-10 12:55:38,550] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 30 +26: [2023-05-10 12:55:38,550] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 212 + 3: [2023-05-10 12:55:38,554] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 30 +14: [2023-05-10 12:55:38,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt. +14: [2023-05-10 12:55:38,556] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 116 +20: [2023-05-10 12:55:38,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:55:38,557] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 166 +14: [2023-05-10 12:55:38,560] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 116 +22: [2023-05-10 12:55:38,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt. +22: [2023-05-10 12:55:38,561] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 180 +20: [2023-05-10 12:55:38,561] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 166 +18: [2023-05-10 12:55:38,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt. +18: [2023-05-10 12:55:38,566] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 150 +22: [2023-05-10 12:55:38,566] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 180 +18: [2023-05-10 12:55:38,570] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 150 + 5: [2023-05-10 12:55:38,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt. + 5: [2023-05-10 12:55:38,604] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 42 + 5: [2023-05-10 12:55:38,608] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 42 + 3: [2023-05-10 12:55:38,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:55:38,618] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 29 + 3: [2023-05-10 12:55:38,622] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 29 +28: [2023-05-10 12:55:38,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:55:38,646] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 229 + 7: [2023-05-10 12:55:38,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:55:38,648] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 63 +28: [2023-05-10 12:55:38,651] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 229 + 7: [2023-05-10 12:55:38,653] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 63 + 7: [2023-05-10 12:55:38,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:55:38,654] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 59 + 7: [2023-05-10 12:55:38,658] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 59 +25: [2023-05-10 12:55:38,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:55:38,659] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 204 +18: [2023-05-10 12:55:38,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:55:38,663] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 145 +25: [2023-05-10 12:55:38,663] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 204 +21: [2023-05-10 12:55:38,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:55:38,666] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 171 +18: [2023-05-10 12:55:38,669] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 145 +25: [2023-05-10 12:55:38,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:55:38,669] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 203 +21: [2023-05-10 12:55:38,670] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 171 +25: [2023-05-10 12:55:38,673] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 203 +25: [2023-05-10 12:55:38,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:55:38,678] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 207 +25: [2023-05-10 12:55:38,683] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 207 + 3: [2023-05-10 12:55:38,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:55:38,690] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 31 +20: [2023-05-10 12:55:38,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt. +20: [2023-05-10 12:55:38,691] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 164 + 3: [2023-05-10 12:55:38,694] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 31 +20: [2023-05-10 12:55:38,695] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 164 + 5: [2023-05-10 12:55:38,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:55:38,710] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 45 +28: [2023-05-10 12:55:38,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:55:38,712] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 231 +15: [2023-05-10 12:55:38,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,714] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 121 + 5: [2023-05-10 12:55:38,716] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 45 +28: [2023-05-10 12:55:38,717] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 231 +15: [2023-05-10 12:55:38,718] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 121 +21: [2023-05-10 12:55:38,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:55:38,720] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 169 +24: [2023-05-10 12:55:38,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:55:38,723] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 195 +25: [2023-05-10 12:55:38,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt. +25: [2023-05-10 12:55:38,724] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 206 +21: [2023-05-10 12:55:38,724] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 169 + 4: [2023-05-10 12:55:38,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt. + 4: [2023-05-10 12:55:38,727] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 32 +24: [2023-05-10 12:55:38,727] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 195 +25: [2023-05-10 12:55:38,728] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 206 +27: [2023-05-10 12:55:38,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:38,731] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 217 + 4: [2023-05-10 12:55:38,732] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 32 +27: [2023-05-10 12:55:38,735] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 217 +11: [2023-05-10 12:55:38,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt. +11: [2023-05-10 12:55:38,737] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 88 +18: [2023-05-10 12:55:38,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:55:38,739] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 149 +11: [2023-05-10 12:55:38,741] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 88 +18: [2023-05-10 12:55:38,744] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 149 +24: [2023-05-10 12:55:38,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt. +24: [2023-05-10 12:55:38,746] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 194 + 7: [2023-05-10 12:55:38,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:55:38,749] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 61 +24: [2023-05-10 12:55:38,750] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 194 + 7: [2023-05-10 12:55:38,753] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 61 + 7: [2023-05-10 12:55:38,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt. + 7: [2023-05-10 12:55:38,754] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 57 + 5: [2023-05-10 12:55:38,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:55:38,756] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 47 + 7: [2023-05-10 12:55:38,759] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 57 + 5: [2023-05-10 12:55:38,760] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 47 + 3: [2023-05-10 12:55:38,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:55:38,763] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 27 + 3: [2023-05-10 12:55:38,768] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 27 + 3: [2023-05-10 12:55:38,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt. + 3: [2023-05-10 12:55:38,772] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 25 +24: [2023-05-10 12:55:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:55:38,775] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 197 +25: [2023-05-10 12:55:38,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:55:38,776] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 205 + 3: [2023-05-10 12:55:38,776] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 25 +18: [2023-05-10 12:55:38,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:55:38,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:55:38,778] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 151 +17: [2023-05-10 12:55:38,778] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 141 +24: [2023-05-10 12:55:38,779] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 197 +25: [2023-05-10 12:55:38,780] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 205 +17: [2023-05-10 12:55:38,782] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 141 +20: [2023-05-10 12:55:38,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:38,783] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 163 +18: [2023-05-10 12:55:38,784] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 151 +15: [2023-05-10 12:55:38,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,785] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 123 +27: [2023-05-10 12:55:38,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:38,786] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 223 + 6: [2023-05-10 12:55:38,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:38,787] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 163 + 6: [2023-05-10 12:55:38,788] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 49 +15: [2023-05-10 12:55:38,790] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 123 +15: [2023-05-10 12:55:38,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:38,790] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 223 +15: [2023-05-10 12:55:38,790] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 127 + 6: [2023-05-10 12:55:38,792] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 49 +15: [2023-05-10 12:55:38,794] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 127 +24: [2023-05-10 12:55:38,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:55:38,796] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 199 +21: [2023-05-10 12:55:38,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:55:38,800] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 175 +24: [2023-05-10 12:55:38,800] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 199 +28: [2023-05-10 12:55:38,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:55:38,802] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 227 +27: [2023-05-10 12:55:38,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:38,803] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 219 +21: [2023-05-10 12:55:38,804] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 175 +17: [2023-05-10 12:55:38,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:55:38,805] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 137 + 0: [2023-05-10 12:55:38,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt. +28: [2023-05-10 12:55:38,806] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 227 + 0: [2023-05-10 12:55:38,807] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 4 + 6: [2023-05-10 12:55:38,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:55:38,807] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 53 +27: [2023-05-10 12:55:38,807] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 219 + 8: [2023-05-10 12:55:38,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:55:38,810] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 67 +17: [2023-05-10 12:55:38,810] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 137 + 0: [2023-05-10 12:55:38,811] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 4 + 6: [2023-05-10 12:55:38,811] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 53 + 8: [2023-05-10 12:55:38,814] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 67 +17: [2023-05-10 12:55:38,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:55:38,815] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 139 +25: [2023-05-10 12:55:38,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt. +25: [2023-05-10 12:55:38,816] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 201 +17: [2023-05-10 12:55:38,819] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 139 +25: [2023-05-10 12:55:38,821] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 201 +15: [2023-05-10 12:55:38,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,822] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 125 + 5: [2023-05-10 12:55:38,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:55:38,825] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 43 + 0: [2023-05-10 12:55:38,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt. +15: [2023-05-10 12:55:38,827] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 125 + 0: [2023-05-10 12:55:38,827] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 5 + 5: [2023-05-10 12:55:38,830] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 43 + 8: [2023-05-10 12:55:38,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:55:38,830] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 71 + 0: [2023-05-10 12:55:38,832] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 5 + 1: [2023-05-10 12:55:38,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:55:38,832] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 13 + 8: [2023-05-10 12:55:38,834] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 71 + 1: [2023-05-10 12:55:38,836] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 13 +13: [2023-05-10 12:55:38,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:55:38,839] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 107 +13: [2023-05-10 12:55:38,843] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 107 +28: [2023-05-10 12:55:38,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt. +28: [2023-05-10 12:55:38,844] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 225 +26: [2023-05-10 12:55:38,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:55:38,846] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 209 +21: [2023-05-10 12:55:38,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt. +27: [2023-05-10 12:55:38,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt. +21: [2023-05-10 12:55:38,847] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 173 +27: [2023-05-10 12:55:38,847] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 221 +28: [2023-05-10 12:55:38,848] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 225 + 8: [2023-05-10 12:55:38,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:55:38,849] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 69 +26: [2023-05-10 12:55:38,851] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 209 +21: [2023-05-10 12:55:38,852] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 173 +27: [2023-05-10 12:55:38,852] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 221 + 8: [2023-05-10 12:55:38,853] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 69 +18: [2023-05-10 12:55:38,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt. +18: [2023-05-10 12:55:38,859] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 147 +17: [2023-05-10 12:55:38,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt. +17: [2023-05-10 12:55:38,863] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 143 +26: [2023-05-10 12:55:38,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:55:38,864] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 213 +18: [2023-05-10 12:55:38,864] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 147 +20: [2023-05-10 12:55:38,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:38,867] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 167 +23: [2023-05-10 12:55:38,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,867] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 191 +17: [2023-05-10 12:55:38,868] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 143 +26: [2023-05-10 12:55:38,868] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 213 +20: [2023-05-10 12:55:38,870] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 167 +23: [2023-05-10 12:55:38,872] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 191 +14: [2023-05-10 12:55:38,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:55:38,876] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 113 +24: [2023-05-10 12:55:38,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt. +24: [2023-05-10 12:55:38,877] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 193 +22: [2023-05-10 12:55:38,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:55:38,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:55:38,878] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 183 +16: [2023-05-10 12:55:38,878] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 133 + 6: [2023-05-10 12:55:38,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:55:38,879] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 51 +14: [2023-05-10 12:55:38,881] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 113 +16: [2023-05-10 12:55:38,882] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 133 +24: [2023-05-10 12:55:38,882] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 193 + 6: [2023-05-10 12:55:38,883] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 51 +22: [2023-05-10 12:55:38,883] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 183 + 5: [2023-05-10 12:55:38,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt. + 5: [2023-05-10 12:55:38,885] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 41 + 5: [2023-05-10 12:55:38,889] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 41 +13: [2023-05-10 12:55:38,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:55:38,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:55:38,893] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 105 + 0: [2023-05-10 12:55:38,893] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 7 +13: [2023-05-10 12:55:38,897] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 105 + 0: [2023-05-10 12:55:38,897] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 7 + 1: [2023-05-10 12:55:38,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:38,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:55:38,903] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 9 +10: [2023-05-10 12:55:38,903] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 85 + 1: [2023-05-10 12:55:38,907] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 9 +10: [2023-05-10 12:55:38,907] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 85 + 6: [2023-05-10 12:55:38,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt. + 6: [2023-05-10 12:55:38,911] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 55 + 6: [2023-05-10 12:55:38,915] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 55 +19: [2023-05-10 12:55:38,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:38,918] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 157 +19: [2023-05-10 12:55:38,923] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 157 +20: [2023-05-10 12:55:38,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:38,929] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 165 +30: [2023-05-10 12:55:38,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:38,930] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 245 +20: [2023-05-10 12:55:38,933] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 165 +30: [2023-05-10 12:55:38,934] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 245 +29: [2023-05-10 12:55:38,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:38,936] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 237 +29: [2023-05-10 12:55:38,940] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 237 + 8: [2023-05-10 12:55:38,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt. + 8: [2023-05-10 12:55:38,942] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 65 +14: [2023-05-10 12:55:38,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:55:38,945] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 117 +14: [2023-05-10 12:55:38,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:55:38,946] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 115 +31: [2023-05-10 12:55:38,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:38,946] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 255 + 8: [2023-05-10 12:55:38,946] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 65 +26: [2023-05-10 12:55:38,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:55:38,947] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 215 +14: [2023-05-10 12:55:38,950] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 117 +31: [2023-05-10 12:55:38,950] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 255 +14: [2023-05-10 12:55:38,951] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 115 +26: [2023-05-10 12:55:38,951] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 215 +23: [2023-05-10 12:55:38,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,952] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 187 +12: [2023-05-10 12:55:38,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:55:38,955] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 97 +13: [2023-05-10 12:55:38,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,957] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 187 +13: [2023-05-10 12:55:38,958] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 109 + 9: [2023-05-10 12:55:38,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:55:38,959] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 79 +12: [2023-05-10 12:55:38,959] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 97 +22: [2023-05-10 12:55:38,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt. +22: [2023-05-10 12:55:38,961] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 179 +13: [2023-05-10 12:55:38,962] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 109 + 9: [2023-05-10 12:55:38,964] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 79 +12: [2023-05-10 12:55:38,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:55:38,964] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 101 +22: [2023-05-10 12:55:38,966] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 179 +19: [2023-05-10 12:55:38,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:38,967] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 159 +12: [2023-05-10 12:55:38,969] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 101 +11: [2023-05-10 12:55:38,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:55:38,971] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 91 +19: [2023-05-10 12:55:38,971] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 159 +23: [2023-05-10 12:55:38,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:38,974] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 185 +11: [2023-05-10 12:55:38,975] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 91 +23: [2023-05-10 12:55:38,978] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 185 + 1: [2023-05-10 12:55:38,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:55:38,981] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 11 + 1: [2023-05-10 12:55:38,985] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 11 +19: [2023-05-10 12:55:38,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:38,987] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 153 +20: [2023-05-10 12:55:38,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:38,989] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 161 +13: [2023-05-10 12:55:38,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt. +13: [2023-05-10 12:55:38,991] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 111 +22: [2023-05-10 12:55:38,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:38,992] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 153 +22: [2023-05-10 12:55:38,992] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 177 + 9: [2023-05-10 12:55:38,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt. +20: [2023-05-10 12:55:38,993] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 161 +12: [2023-05-10 12:55:38,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:55:38,993] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 75 +12: [2023-05-10 12:55:38,994] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 103 +13: [2023-05-10 12:55:38,995] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 111 +22: [2023-05-10 12:55:38,997] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 177 + 4: [2023-05-10 12:55:38,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:38,998] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 39 + 9: [2023-05-10 12:55:38,998] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 75 +12: [2023-05-10 12:55:38,998] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 103 + 1: [2023-05-10 12:55:38,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt. + 1: [2023-05-10 12:55:38,999] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 15 + 2: [2023-05-10 12:55:38,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:55:39,000] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 17 + 4: [2023-05-10 12:55:39,002] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 39 +19: [2023-05-10 12:55:39,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt. +19: [2023-05-10 12:55:39,003] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 155 + 1: [2023-05-10 12:55:39,003] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 15 +14: [2023-05-10 12:55:39,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt. +14: [2023-05-10 12:55:39,004] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 119 + 2: [2023-05-10 12:55:39,005] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 17 +30: [2023-05-10 12:55:39,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:39,005] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 243 + 9: [2023-05-10 12:55:39,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:55:39,006] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 73 +30: [2023-05-10 12:55:39,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:39,007] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 247 +10: [2023-05-10 12:55:39,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:39,008] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 87 +19: [2023-05-10 12:55:39,008] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 155 +14: [2023-05-10 12:55:39,008] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 119 +11: [2023-05-10 12:55:39,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:55:39,009] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 93 +22: [2023-05-10 12:55:39,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:39,010] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 243 +22: [2023-05-10 12:55:39,010] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 181 + 9: [2023-05-10 12:55:39,011] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 73 +16: [2023-05-10 12:55:39,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:55:39,011] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 131 +30: [2023-05-10 12:55:39,012] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 247 +10: [2023-05-10 12:55:39,012] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 87 +11: [2023-05-10 12:55:39,013] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 93 +22: [2023-05-10 12:55:39,015] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 181 +16: [2023-05-10 12:55:39,015] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 131 +31: [2023-05-10 12:55:39,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:39,015] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 249 +26: [2023-05-10 12:55:39,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt. +26: [2023-05-10 12:55:39,015] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 211 +31: [2023-05-10 12:55:39,019] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 249 +26: [2023-05-10 12:55:39,020] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 211 +31: [2023-05-10 12:55:39,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:39,027] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 251 +23: [2023-05-10 12:55:39,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt. +23: [2023-05-10 12:55:39,028] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 189 + 4: [2023-05-10 12:55:39,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:55:39,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:39,029] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 37 +11: [2023-05-10 12:55:39,029] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 95 +31: [2023-05-10 12:55:39,031] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 251 +23: [2023-05-10 12:55:39,031] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 189 +29: [2023-05-10 12:55:39,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:39,033] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 239 +11: [2023-05-10 12:55:39,034] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 95 + 4: [2023-05-10 12:55:39,034] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 37 +30: [2023-05-10 12:55:39,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt. +30: [2023-05-10 12:55:39,035] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 241 +29: [2023-05-10 12:55:39,037] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 239 +10: [2023-05-10 12:55:39,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:39,038] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 83 +30: [2023-05-10 12:55:39,040] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 241 +10: [2023-05-10 12:55:39,043] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 83 +29: [2023-05-10 12:55:39,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:39,046] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 233 +29: [2023-05-10 12:55:39,050] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 233 + 0: [2023-05-10 12:55:39,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:55:39,058] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 1 + 0: [2023-05-10 12:55:39,062] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 1 +16: [2023-05-10 12:55:39,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:39,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:55:39,064] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 129 + 4: [2023-05-10 12:55:39,064] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 33 + 2: [2023-05-10 12:55:39,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:55:39,065] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 21 +16: [2023-05-10 12:55:39,068] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 129 + 4: [2023-05-10 12:55:39,069] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 33 + 2: [2023-05-10 12:55:39,070] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 21 + 2: [2023-05-10 12:55:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:55:39,076] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 23 + 0: [2023-05-10 12:55:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt. + 0: [2023-05-10 12:55:39,078] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 3 + 2: [2023-05-10 12:55:39,080] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 23 + 0: [2023-05-10 12:55:39,083] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 3 +12: [2023-05-10 12:55:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt. + 9: [2023-05-10 12:55:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt. +12: [2023-05-10 12:55:39,096] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 99 + 9: [2023-05-10 12:55:39,096] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 77 +12: [2023-05-10 12:55:39,099] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 99 + 9: [2023-05-10 12:55:39,100] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 77 +10: [2023-05-10 12:55:39,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt. +10: [2023-05-10 12:55:39,101] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 81 +10: [2023-05-10 12:55:39,106] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 81 +16: [2023-05-10 12:55:39,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt. +16: [2023-05-10 12:55:39,108] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 135 +31: [2023-05-10 12:55:39,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt. +31: [2023-05-10 12:55:39,109] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 253 + 4: [2023-05-10 12:55:39,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt. + 4: [2023-05-10 12:55:39,110] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 35 +11: [2023-05-10 12:55:39,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt. +11: [2023-05-10 12:55:39,112] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 89 +16: [2023-05-10 12:55:39,113] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 135 +31: [2023-05-10 12:55:39,113] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 253 +29: [2023-05-10 12:55:39,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt. +29: [2023-05-10 12:55:39,114] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 235 + 4: [2023-05-10 12:55:39,114] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 35 +11: [2023-05-10 12:55:39,116] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 89 +29: [2023-05-10 12:55:39,118] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 235 + 2: [2023-05-10 12:55:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt. + 2: [2023-05-10 12:55:39,141] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 19 + 2: [2023-05-10 12:55:39,147] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 19 + 0: successfully loaded checkpoint from lm1-4b2-84b-c4-perplexity/perplexity2575 at iteration 0 +31: time (ms) | load-checkpoint: 14008.33 + 0: estimated model parameters: 2.81512448 + 0: estimated model parameters without embeddings: 2.6755328 + 0: [after model, optimizer, and learning rate scheduler are built] datetime: 2023-05-10 12:55:40 + 0: > building train, validation, and test datasets ... + 0: > datasets target sizes (minimum size): + 0: train: 1 + 0: validation: 102400 + 0: test: 102400 + 0: > building train, validation, and test datasets for GPT ... + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.039954 seconds + 0: number of documents: 3133972 + 0: > dataset split: + 0: train: + 0: document indices in [0, 3133972) total of 3133972 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.082 seconds + 0: total number of samples: 731002 + 0: total number of epochs: 1 + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.045771 seconds + 0: number of documents: 364608 + 0: > dataset split: + 0: validation: + 0: document indices in [0, 364608) total of 364608 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_102400ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.103 seconds + 0: total number of samples: 169955 + 0: total number of epochs: 2 + 0: > finished creating GPT datasets ... + 0: [after dataloaders are built] datetime: 2023-05-10 12:55:47 + 0: done with setup ... + 0: training ... +31: time (ms) | model-and-optimizer-setup: 31696.75 | train/valid/test-data-iterators-setup: 3974.55 + 0: [after training is done] datetime: 2023-05-10 12:55:47 +31: ----------------------------------------------------------------------------------------------------------------- +31: validation loss at the end of training for val data | lm loss value: 2.612976E+00 | lm loss PPL: 1.363958E+01 | +31: ----------------------------------------------------------------------------------------------------------------- +END 3491175: Wed 10 May 2023 12:57:27 PM EEST